[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9934193562983836, "4": 0.005875938423782536, "3": 0.0006858131112054633, "1": 1.6856958821199286e-05, "2": 0}, "score": 4.992684992630962}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.996703912263216, "4": 0.0030928818041270046, "3": 0.0001566944229272288, "1": 4.479661407869946e-05, "2": 0}, "score": 4.996414536745009}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9973129875976606, "4": 0.002633726804259968, "3": 5.021257824513888e-05, "1": 2.3240899846390372e-06, "2": 0}, "score": 4.99725654962466}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978715157420852, "4": 0.0020704858274318044, "3": 3.5772074888057075e-05, "1": 2.0926338020521403e-05, "2": 0}, "score": 4.997774261777211}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9849841552303388, "5": 0.014981435166122091, "1": 1.962298450405836e-05, "3": 1.032389961102611e-05, "2": 0}, "score": 4.014912308862449}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9443460704169961, "4": 0.045405964768440464, "3": 0.008328390989369291, "1": 0.0018564763935405495, "2": 4.890812597163369e-05}, "score": 4.930363635209076}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9810397699739756, "4": 0.01720939712289687, "3": 0.001635623175755519, "1": 0.00011152385988017047, "2": 2.159985606387272e-06}, "score": 4.979066749187584}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9912393173891031, "4": 0.007803476027541751, "3": 0.0008172416741935829, "1": 0.00013758976740767918, "2": 1.6172651731467694e-06}, "score": 4.990006822185326}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9334401514999197, "4": 0.06044260753319617, "3": 0.005272598309902336, "1": 0.0008247784938360899, "2": 1.2572470692283074e-05}, "score": 4.925674822503242}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9687047646109066, "4": 0.027442062910394815, "3": 0.0022137030000787643, "1": 0.0016218193570345179, "2": 1.0741476517294657e-05}, "score": 4.961610764014151}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9680418782368375, "4": 0.027995432699138883, "3": 0.0033857325005552615, "1": 0.0005596837309143329, "2": 1.366044674150851e-05}, "score": 4.962953252208723}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9834470863234643, "4": 0.014681198756023884, "3": 0.0014289782508346786, "1": 0.00043162258387969605, "2": 7.803517222061046e-06}, "score": 4.980710879997167}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9941139565303493, "4": 0.005119764689852766, "3": 0.000545140390077951, "1": 0.00021758934721375568, "2": 1.6856994102750676e-06}, "score": 4.992914526840238}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903191738343837, "4": 0.009012461934624655, "3": 0.0003923771748630235, "1": 0.0002713416038702757, "2": 0}, "score": 4.989117366745415}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9765936798115311, "4": 0.0219336849125473, "3": 0.0011616835381827134, "1": 0.00030264562238904366, "2": 5.2710340512507285e-06}, "score": 4.974516475074807}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9386720033513156, "4": 0.052891544088134575, "3": 0.007755998771463131, "1": 0.0006624368668271719, "2": 1.6816365648215173e-05}, "score": 4.92889617644052}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7863640781857731, "4": 0.19602395653526855, "3": 0.01737324325967168, "1": 0.0001852411626350417, "2": 5.2262210533530756e-05}, "score": 4.768331523341358}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9332396234258696, "4": 0.05934846629275257, "3": 0.007194352037713605, "1": 0.0002050136491136686, "2": 1.0969597229332355e-05}, "score": 4.925409748764232}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8106861022796819, "4": 0.17243359036968298, "3": 0.015212618972384653, "1": 0.0016382789645892242, "2": 2.758525961027371e-05}, "score": 4.790504917897057}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9127496645155049, "4": 0.07381918660997382, "3": 0.013302494565846722, "1": 0.00011791199698496867, "2": 1.03939359874803e-05}, "score": 4.899072959301902}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"5": 0.95213092251126, "4": 0.038223139526236634, "1": 0.006186865511136469, "3": 0.0034323950368606517, "2": 1.610504469435384e-05}, "score": 4.930115554377211}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9472950324671687, "4": 0.04953771897929785, "3": 0.002128720891644641, "1": 0.0010108389998930484, "2": 0}, "score": 4.942159881722356}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9439257033616619, "4": 0.053040786753699255, "3": 0.002100135526303793, "1": 0.000920647160398514, "2": 0}, "score": 4.939075578154923}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9761988505535744, "4": 0.02318444730258892, "3": 0.0004359334342541822, "1": 0.00017314087300466542, "2": 0}, "score": 4.97525093355505}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9596497200991652, "4": 0.03781242222699257, "3": 0.002045780294829349, "1": 0.00047991459354901274, "2": 0}, "score": 4.956175825785125}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9340943488086189, "4": 0.0608774349013397, "3": 0.0041854920804729485, "1": 0.0007964844115437311, "2": 2.233979367593348e-05}, "score": 4.927496891085894}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9304616110602069, "4": 0.06452742188663109, "3": 0.004790350485431034, "1": 0.00018304033858273412, "2": 0}, "score": 4.925156903466831}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9871453687096704, "4": 0.01220909271910484, "3": 0.0003867439932433146, "1": 0.0002448768810634069, "2": 0}, "score": 4.986037717447338}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912094498159786, "4": 0.00847768721887614, "3": 0.00022107865826937714, "1": 8.521969405158867e-05, "2": 0}, "score": 4.990739215894917}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9835543213390997, "4": 0.015686722893287267, "3": 0.0005138599502328541, "1": 0.0002339027797716295, "2": 0}, "score": 4.9823497485272314}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9957541083936973, "4": 0.004187352526513999, "3": 5.590274910679697e-05, "1": 2.0525903029961495e-06, "2": 0}, "score": 4.995692629099674}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9680898023362512, "4": 0.030326104582526728, "3": 0.0014333857153865232, "1": 0.00014800662821004185, "2": 0}, "score": 4.966215006229457}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987559001347031, "4": 0.0012099942154557468, "3": 2.173818861760274e-05, "1": 1.1715942931488787e-05, "2": 0}, "score": 4.99869966478839}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998380405760584, "4": 0.0015645500567519506, "3": 4.582851785625059e-05, "1": 8.942700008521556e-06, "2": 0}, "score": 4.99830802164565}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9918735237949876, "4": 0.007713949235845758, "3": 0.0003883671122813554, "1": 2.231048077496768e-05, "2": 0}, "score": 4.991420058748953}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9884874890018673, "4": 0.011026351280885943, "3": 0.00041138131494299865, "1": 7.192533434605728e-05, "2": 0}, "score": 4.9878631501245865}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9547213320342598, "4": 0.04077692994579282, "3": 0.003882620370786025, "1": 0.000599374467950975, "2": 1.706464122248117e-05}, "score": 4.9490090009357335}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9792836108224446, "4": 0.02010461677486686, "3": 0.000504224375235895, "1": 9.309733492787042e-05, "2": 0}, "score": 4.978514234650762}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9778851533062393, "4": 0.021024166861421154, "3": 0.0010134360421333402, "1": 6.993292427139814e-05, "2": 0}, "score": 4.976669058787843}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.993300665273652, "4": 0.00648376123180119, "3": 0.00016120527582248227, "1": 5.3114213039770876e-05, "2": 0}, "score": 4.9929813625629835}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"5": 0.984452657422301, "4": 0.013555241227353527, "3": 0.0014580957141284488, "1": 0.000517094455974181, "2": 7.794252148144822e-06}, "score": 4.981436637523208}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9848450449075417, "4": 0.013430876583849411, "3": 0.0008643359791427207, "1": 0.0008467708017415778, "2": 0}, "score": 4.981453127665921}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9721031030989389, "4": 0.024820893516367716, "3": 0.002635047685997003, "1": 0.0004170908475755866, "2": 1.3531124603260228e-05}, "score": 4.968199725732189}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9956875648680704, "4": 0.0041126717534742206, "1": 0.00013860865877995355, "3": 5.11753800482971e-05, "2": 0}, "score": 4.995230495254803}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9890907630719967, "4": 0.010059695330577658, "1": 0.0004566740317593886, "3": 0.000384616816929426, "2": 0}, "score": 4.987344270489281}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9901963095857542, "4": 0.00905439956154988, "3": 0.000696717874714473, "1": 4.894795339373619e-05, "2": 0}, "score": 4.989356334291897}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9726066817970624, "4": 0.02611739269001052, "3": 0.0011926968207188464, "1": 7.868094923613395e-05, "2": 0}, "score": 4.971182358816382}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9899134073522007, "4": 0.009560925949183244, "3": 0.0004924676917556892, "1": 2.9297613376084896e-05, "2": 0}, "score": 4.989336906612878}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9939329142473436, "4": 0.005813987655992567, "3": 0.000206246809904252, "1": 4.428768103760277e-05, "2": 0}, "score": 4.993596351583619}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.993129200025036, "4": 0.006409182187771906, "3": 0.0003735013271940467, "1": 8.473506935723073e-05, "2": 0}, "score": 4.992504849536379}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9784339027433883, "4": 0.021014550504991316, "3": 0.0004821691364349001, "1": 6.569767639461301e-05, "2": 0}, "score": 4.9777582386682395}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9969007702585505, "4": 0.002976003458147614, "3": 6.477706191927229e-05, "1": 5.627107051987202e-05, "2": 0}, "score": 4.996669350881278}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9684454228196633, "4": 0.02969100027907977, "3": 0.0018236769750966607, "1": 3.784211205239803e-05, "2": 1.4539115687414573e-06}, "score": 4.966505895360637}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9973892313000066, "4": 0.0024685162928088007, "1": 7.996144315765597e-05, "3": 6.140943930610608e-05, "2": 0}, "score": 4.9970888164896685}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9962712623714377, "4": 0.0035491150083362235, "3": 9.836318107445622e-05, "1": 7.863701819487074e-05, "2": 0}, "score": 4.995939599908657}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9616956120265118, "4": 0.03621224346745463, "3": 0.0018609568277610574, "1": 0.0002186408781353166, "2": 0}, "score": 4.959190767339197}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9863725637957762, "4": 0.013191784889371914, "3": 0.00042317430298442456, "1": 1.0215534561817859e-05, "2": 0}, "score": 4.985920972527011}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.989667453834473, "4": 0.0097086892062349, "3": 0.0004615639240326267, "1": 0.00015968251424544461, "2": 0}, "score": 4.988729423466641}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9844843120219561, "4": 0.015007540562900242, "3": 0.0003856992258044876, "1": 0.0001177425613866966, "2": 0}, "score": 4.983750014273556}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9655847795591348, "4": 0.033294302257965126, "3": 0.000806445692440347, "1": 0.0002990774464157833, "2": 0}, "score": 4.963895940747909}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9796784053296199, "4": 0.018940480915891934, "3": 0.0011022056173933007, "1": 0.00026655738745445687, "2": 7.353846855171132e-06}, "score": 4.9777667056613275}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9585506307415197, "4": 0.039590982551431994, "3": 0.0012301637357024625, "1": 0.0006053413767359714, "2": 0}, "score": 4.955526306841201}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.957894885395968, "4": 0.036940831314909946, "3": 0.004401605140164911, "1": 0.000735953956717519, "2": 1.5212136420280037e-05}, "score": 4.951265945139469}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9797881423143061, "4": 0.01889645009914521, "3": 0.0009744487806678147, "1": 0.00033478132515888173, "2": 4.322515644837117e-06}, "score": 4.9778025183163965}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.982397541634764, "4": 0.017092645426622498, "3": 0.00031858252861064623, "1": 0.00018023139587946708, "2": 0}, "score": 4.981549060990501}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9372256818328806, "4": 0.057351556236692004, "3": 0.0047930875152496135, "1": 0.0006150376946021624, "2": 1.0478772644543957e-05}, "score": 4.9305703929517755}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9412511387889756, "4": 0.05373221771075765, "3": 0.00455759138522391, "1": 0.0004464107793050408, "2": 1.0935469163506052e-05}, "score": 4.9353340396825836}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.876507910115866, "4": 0.11574821584507863, "3": 0.007331161626437644, "1": 0.0003781982609420348, "2": 2.4526460568867433e-05}, "score": 4.868001770119026}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9837164834711729, "4": 0.01570501799780724, "3": 0.00045643146528980363, "1": 0.00011914074888824485, "2": 0}, "score": 4.9829055060521545}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9439178404933017, "4": 0.05374433569210247, "3": 0.0021684568357623786, "1": 0.00015364512466878145, "2": 8.49723280350972e-06}, "score": 4.9412782541969085}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9415103668052353, "4": 0.05036493903761097, "3": 0.006926681780525511, "1": 0.0011527449127842159, "2": 3.5046388090269586e-05}, "score": 4.931064873994786}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9828265136825817, "4": 0.01590380325391315, "3": 0.0009605644284240822, "1": 0.00029321219384101816, "2": 7.405874658012624e-06}, "score": 4.980979839807762}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9783808397980278, "4": 0.018301041649810758, "3": 0.002863758374180167, "1": 0.00044203137245519744, "2": 7.706241292202563e-06}, "score": 4.974180078033883}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.987233770548382, "4": 0.011800472570086677, "3": 0.00060481616839436, "1": 0.00034617687988195805, "2": 0}, "score": 4.985604975047849}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9848371957238128, "4": 0.014464053160104313, "3": 0.000565979046932624, "1": 0.0001263505968952444, "2": 3.1352990427235876e-06}, "score": 4.983889127518204}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9437029197697085, "4": 0.053162346807287514, "3": 0.002741211234153062, "1": 0.0003796968829516531, "2": 1.2459402490104919e-05}, "score": 4.939798982756355}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9889958411247156, "4": 0.010224504887357204, "3": 0.0006302266760741984, "1": 0.00014735380886704422, "2": 1.1371743645821798e-06}, "score": 4.987922203693148}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.994638843072679, "4": 0.005172490422321185, "1": 0.00010165081502177752, "3": 8.542301474290107e-05, "2": 0}, "score": 4.9942500511303045}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9896846182808039, "4": 0.00983337074239847, "3": 0.0002876710264459535, "1": 0.00019212410779384365, "2": 1.0312199903372215e-06}, "score": 4.988819683869108}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9974670269038102, "4": 0.0024771043544304953, "1": 2.9532653750249463e-05, "3": 2.5258722913003478e-05, "2": 0}, "score": 4.997354244734298}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9663731139678557, "5": 0.021414076346315196, "3": 0.006239638693249544, "4": 0.004403762455182608, "2": 0.0015664709378911692}, "score": 1.1129136727703481}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9907951226671614, "4": 0.009062934637059435, "3": 0.0001001576613526497, "1": 3.8534138318261095e-05, "2": 0}, "score": 4.990582582871917}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9888736616976058, "4": 0.010912534459726056, "3": 0.00017736638377239067, "1": 3.375925351511793e-05, "2": 0}, "score": 4.988597665220873}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9565400658520152, "4": 0.04148451723630039, "3": 0.001166654065748742, "1": 0.0007968381291419531, "2": 5.7176424306994155e-06}, "score": 4.952977377315426}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9745832424552525, "4": 0.023221688218350016, "3": 0.0016627623389805556, "1": 0.0005238225898286287, "2": 6.878382743521953e-06}, "score": 4.971336815562645}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8956087807360946, "4": 0.09683649899827151, "3": 0.0068948329205700985, "1": 0.0006327171981658329, "2": 2.4041044519757454e-05}, "score": 4.886770488927633}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9231076229783806, "4": 0.07369357951997141, "3": 0.003149885109450739, "1": 4.158204892720122e-05, "2": 5.073168423249086e-06}, "score": 4.919824921590978}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9928405101359429, "4": 0.006925373453912506, "3": 0.0001759898913653054, "1": 5.5515238906987475e-05, "2": 0}, "score": 4.992500566224607}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.977756350845679, "4": 0.02073958678410531, "3": 0.0013882577989918375, "1": 0.00010782284518531094, "2": 0}, "score": 4.976052415094109}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9820213544385551, "4": 0.017324181134276837, "3": 0.0005879968307271417, "1": 6.201886158943625e-05, "2": 0}, "score": 4.981251666351545}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9468471227859226, "4": 0.05002318905335948, "3": 0.0029284863310661486, "1": 0.0001904427373352849, "2": 9.175717182945482e-06}, "score": 4.9433304504544635}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9888258656442881, "4": 0.010928415011287879, "3": 0.00020096315000927263, "1": 4.288905040170032e-05, "2": 0}, "score": 4.988498081011348}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9949500570528845, "4": 0.00474512264522156, "3": 0.00015553123163260767, "1": 0.00014802505618237148, "2": 0}, "score": 4.9943517075272625}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9790561555346243, "4": 0.019077726046830463, "3": 0.001016446050588353, "1": 0.0008401511851503035, "2": 5.749285337557398e-06}, "score": 4.97551143688703}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9649020494071268, "4": 0.031581698107136895, "3": 0.002278717031218328, "1": 0.0012203153134290367, "2": 1.1348193383116226e-05}, "score": 4.958945320925633}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9854641150400708, "4": 0.01214512286585406, "3": 0.0019526770534061193, "1": 0.0004354859604343397, "2": 2.316986822132492e-06}, "score": 4.982200623204044}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.972857887962772, "4": 0.01574750246398302, "1": 0.007399185147779986, "3": 0.003991301143946873, "2": 3.2399715793631673e-06}, "score": 4.9466633876295045}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9936770703834814, "4": 0.00598560595190638, "3": 0.00016858230001920853, "1": 0.00016801320171692965, "2": 0}, "score": 4.993005171547813}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964479460224993, "4": 0.003019802944167236, "1": 0.00038565842098501046, "3": 0.00014539941736371723, "2": 0}, "score": 4.995146758746302}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9729326938816542, "4": 0.02654380212939329, "3": 0.00044838962717797404, "1": 7.28258196586375e-05, "2": 0}, "score": 4.972268051871885}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8925522264585554, "4": 0.09338833822009808, "3": 0.011500911337657098, "1": 0.0024615599598328255, "2": 9.268193317668259e-05}, "score": 4.873485011717074}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.982298036680242, "4": 0.014737883373322415, "3": 0.0015205593779720151, "1": 0.0014199092753622831, "2": 1.0919678821834191e-05}, "score": 4.976508303585269}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9890410852578341, "4": 0.01026307270661892, "1": 0.00043824387951464313, "3": 0.0002495098910678424, "2": 0}, "score": 4.9874848307671815}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.993533719952553, "4": 0.006165444773728659, "1": 0.00018204202335231868, "3": 0.00011510198459852334, "2": 0}, "score": 4.992876156867665}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9919471850416937, "4": 0.007506321851189587, "1": 0.0003267196807907866, "3": 0.00021536764789413718, "2": 0}, "score": 4.990756023402946}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9532949632361729, "4": 0.04364958518277442, "3": 0.0029181103867642333, "1": 0.0001279278659708172, "2": 6.416556210466664e-06}, "score": 4.9499830830218805}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9807150769895873, "4": 0.01857153586968751, "3": 0.0005797076112898612, "1": 0.00012966297161012323, "2": 0}, "score": 4.979750315687264}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9690086833364444, "4": 0.02698409123906996, "3": 0.003723071050750836, "1": 0.00027636309368613536, "2": 4.715498127769904e-06}, "score": 4.964450058446433}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.994394656889991, "4": 0.005438943209202694, "3": 0.00011889164807575724, "1": 4.6199111114849204e-05, "2": 0}, "score": 4.994138469376613}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9826116893224105, "4": 0.016396353769487906, "3": 0.0008638561466113357, "1": 0.00012491500649143772, "2": 2.2635198511413945e-06}, "score": 4.981369466170038}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9869222684695707, "4": 0.012744429561274657, "3": 0.00026986438579000484, "1": 6.156161590925361e-05, "2": 0}, "score": 4.986469569820861}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9496840392225697, "4": 0.04893169171946078, "3": 0.0011312794840965638, "1": 0.00024895908307559695, "2": 0}, "score": 4.947809702627532}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.697397402008924, "4": 0.27821360417151125, "3": 0.022691617405163667, "1": 0.0016276939833268357, "2": 6.429311555671756e-05}, "score": 4.669697725635009}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9796980921649778, "4": 0.01964832865518668, "3": 0.00047053274744030443, "1": 0.00017975423520491385, "2": 0}, "score": 4.97869151875739}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9934596984867701, "4": 0.00643988433133501, "1": 5.26965273117958e-05, "3": 4.632211801650488e-05, "2": 0}, "score": 4.9932566758926}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8327920481982147, "4": 0.14439880906929167, "3": 0.022184946626310004, "1": 0.0005904355931467476, "2": 3.097683161981162e-05}, "score": 4.808776092504203}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9784939354186607, "4": 0.019540813513395084, "3": 0.0017608375543062332, "1": 0.0001988900298114491, "2": 3.161623172693396e-06}, "score": 4.976132410017307}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9879031049071143, "4": 0.01122533501909597, "3": 0.0008048696653914363, "1": 6.363626790947821e-05, "2": 0}, "score": 4.986910340600825}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9831853324666501, "4": 0.016391943743498998, "3": 0.0002880239274084634, "1": 0.00013001262458909116, "2": 0}, "score": 4.982511875932331}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9582735969298838, "4": 0.03746765693089629, "3": 0.004050366127896282, "1": 0.00019693929971108617, "2": 1.0515212918388729e-05}, "score": 4.953612265043923}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9753902116235273, "4": 0.022488306859351957, "3": 0.0015442086507709272, "1": 0.0005671807624599776, "2": 6.152592624623297e-06}, "score": 4.972135985240793}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9145819759342364, "4": 0.07650247390844858, "3": 0.007892636837658526, "1": 0.0009801514082686143, "2": 3.5032337306015915e-05}, "score": 4.903685805303539}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8635551719824198, "4": 0.1168367053293425, "3": 0.014205515134857662, "1": 0.005272844018708545, "2": 0.00012492450039269475}, "score": 4.833285308086821}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9782793967481549, "4": 0.020330822392413787, "3": 0.0011188554900929321, "1": 0.0002659144280497256, "2": 3.7590022305244737e-06}, "score": 4.976356502308292}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9800845250361032, "4": 0.019076266656610268, "3": 0.0006729765990659021, "1": 0.00016199679611424844, "2": 2.147214794621949e-06}, "score": 4.978923307314662}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9188324141517703, "4": 0.06480717217731452, "3": 0.015370138660029653, "1": 0.0009009155805757952, "2": 7.581760775570515e-05}, "score": 4.900620089571944}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.965961606870429, "4": 0.03122753629025485, "3": 0.0023591176664495097, "1": 0.00043508767302482014, "2": 1.0539294000176165e-05}, "score": 4.962282029262745}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9865576946925032, "4": 0.010737921902614135, "3": 0.0025904465629644413, "1": 9.95856978069921e-05, "2": 6.561567732155556e-06}, "score": 4.983663030218958}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9860314710384225, "4": 0.013524973683751327, "3": 0.00038451067733589106, "1": 5.5912253381985664e-05, "2": 0}, "score": 4.985482310473606}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9820543548386192, "4": 0.016728179272524523, "3": 0.000989284107651452, "1": 0.0002173777357445913, "2": 4.629267082095889e-06}, "score": 4.980409732802388}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9659055489152517, "4": 0.032154322160300876, "3": 0.001816899867104451, "1": 0.00011887262693379692, "2": 2.30152180379878e-06}, "score": 4.963729408499594}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9293688213196611, "4": 0.06522219851331348, "3": 0.004598879003853274, "1": 0.0007885978995830581, "2": 1.771497909005608e-05}, "score": 4.922372212867235}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.990380552252651, "4": 0.009292441046642222, "3": 0.0002773198568724075, "1": 4.685541379653477e-05, "2": 0}, "score": 4.989965469172355}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943213424769644, "4": 0.0055840832777281964, "3": 8.04330818992388e-05, "1": 1.2332136243953246e-05, "2": 0}, "score": 4.994205711531472}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9800241752493491, "4": 0.01916996016333567, "3": 0.0006239221231672049, "1": 0.00017630043520774438, "2": 0}, "score": 4.978876874672214}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9913589225842799, "4": 0.007835993565861806, "3": 0.0004709135624518863, "1": 0.0003300943616447563, "2": 0}, "score": 4.989901760702982}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9708182367751933, "4": 0.02479947984557271, "3": 0.003897038785574834, "1": 0.0004495886070037564, "2": 1.722484051557523e-05}, "score": 4.96555577878724}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9923838296331841, "4": 0.0070117406444016855, "3": 0.0005254308317511289, "1": 7.651115582391687e-05, "2": 1.1579550459385888e-06}, "score": 4.99162786807057}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978791140636705, "4": 0.0018150014724471581, "1": 0.0002440344876087971, "3": 6.066412839947386e-05, "2": 0}, "score": 4.997087528866571}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9862076698966853, "4": 0.012030112468942197, "1": 0.0012137473763107554, "3": 0.0005426330224142461, "2": 0}, "score": 4.982029527083102}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9181808072193459, "4": 0.07221203191104773, "3": 0.00769615519616657, "1": 0.0018629295563885205, "2": 4.3342581487720055e-05}, "score": 4.904813461157734}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5655703092678355, "4": 0.31353132614303314, "3": 0.1170250107424277, "1": 0.0034606830365073054, "2": 0.0004078266301376566}, "score": 4.437349714756378}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9438256600904981, "4": 0.05055151316186345, "3": 0.0050801118495813835, "1": 0.0005151141661621913, "2": 1.8357708315127926e-05}, "score": 4.9371721526301044}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9557272002876178, "4": 0.04297104767273088, "3": 0.0010305032539467272, "1": 0.0002638971800997396, "2": 0}, "score": 4.953912018278312}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9730767083072003, "4": 0.02591416625894011, "3": 0.000858789258162126, "1": 0.00014302401567811677, "2": 0}, "score": 4.971795952929518}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9104273584864758, "4": 0.08387181982981373, "3": 0.00525177061099802, "1": 0.0004356885084947161, "2": 7.674602940239655e-06}, "score": 4.903858314255205}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9609557181516439, "4": 0.03691502607938647, "3": 0.0017508130481439243, "1": 0.0003701450507852607, "2": 4.895955998642533e-06}, "score": 4.958087937180337}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8976130729334201, "4": 0.0904599108908324, "3": 0.010921237400728721, "1": 0.0009757358047981458, "2": 2.2866376533966395e-05}, "score": 4.883725237502189}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9786164250846336, "4": 0.019362400733347503, "1": 0.0010145460580250106, "3": 0.0009907126750823083, "2": 0}, "score": 4.974597585393556}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9155670672877345, "4": 0.07711842897979174, "3": 0.005710739808766229, "1": 0.0015676656707084959, "2": 2.305635780208738e-05}, "score": 4.905119022218667}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9377629504358093, "4": 0.05811759622278692, "3": 0.0036679879858081605, "1": 0.00043831531908917104, "2": 7.165619775545733e-06}, "score": 4.932771267345161}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9291907434355091, "4": 0.06100197733538568, "3": 0.009081417374843498, "1": 0.0007158866597302267, "2": 5.7347522956907e-06}, "score": 4.917954089108174}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8068638630888395, "4": 0.18254044756917098, "3": 0.009824592479505212, "1": 0.0007547521052854732, "2": 1.0494974861269275e-05}, "score": 4.794758673509007}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9700279320223234, "4": 0.02886855033821903, "3": 0.000810743362236001, "1": 0.00028511726676206387, "2": 0}, "score": 4.96836925167329}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9671456706923421, "4": 0.03174896984489158, "3": 0.0007157122909788925, "1": 0.0003761072183639996, "2": 0}, "score": 4.9653147070624435}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9317611164240781, "4": 0.05887142796462185, "3": 0.009163491543984222, "1": 0.00018003307031086348, "2": 2.0548594777849897e-05}, "score": 4.922019547120575}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8400506007256197, "4": 0.14594188273222633, "3": 0.013800031558137983, "1": 0.00017382178634949033, "2": 3.0796685112327385e-05}, "score": 4.8256698772312765}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9121818425701937, "4": 0.07779535919708659, "3": 0.009575603664518702, "1": 0.0003821998188976693, "2": 4.9789621463512915e-05}, "score": 4.901373765709394}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9793547260424674, "4": 0.01980236309838141, "3": 0.0006826805662243916, "1": 0.0001530951399636679, "2": 0}, "score": 4.978219739803827}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9807502764660839, "4": 0.018359263664746498, "3": 0.0007877789718720084, "1": 9.299293829554398e-05, "2": 0}, "score": 4.97969300990504}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9855737559925718, "4": 0.01365381239513836, "3": 0.0004041558447724363, "1": 0.00036339847445080267, "2": 0}, "score": 4.984084204391514}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9846614770526939, "4": 0.014423347950140778, "3": 0.0007029201199446124, "1": 0.00020763537943958, "2": 2.5970379821394223e-06}, "score": 4.983332445468806}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9784100488156199, "4": 0.01928941073932459, "3": 0.0017678515203426357, "1": 0.000520643818353192, "2": 8.87194949997632e-06}, "score": 4.975065615977367}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969632116980803, "4": 0.0028457034033850183, "1": 0.00011501402275899503, "3": 7.402216371070724e-05, "2": 0}, "score": 4.996546189102293}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9907762808954712, "4": 0.008275176737012151, "1": 0.000540266781818017, "3": 0.0004044451217558708, "2": 0}, "score": 4.988754822817958}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6070316971066131, "4": 0.3560953667056447, "3": 0.03382261897040514, "1": 0.0026524742376555594, "2": 0.0003823318152829991}, "score": 4.564495747779021}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8733218323907864, "4": 0.1163508946457964, "3": 0.00755768010727641, "1": 0.002677178600523929, "2": 4.9402624877991845e-05}, "score": 4.857670701047672}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9714517488962239, "4": 0.026859556488307717, "3": 0.00123569266966909, "1": 0.00044016891807879366, "2": 5.398621039825524e-06}, "score": 4.968891955367065}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9754908185581647, "4": 0.023661410661470372, "3": 0.0006466508846844237, "1": 0.00018921795618677672, "2": 0}, "score": 4.974288109723052}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9786592346178558, "4": 0.02052957396486065, "3": 0.0005876560677440625, "1": 0.0002179802708409959, "2": 0}, "score": 4.97742306739965}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9635966989446874, "4": 0.03127599214096363, "3": 0.0033408550558888944, "1": 0.0017450930516878086, "2": 3.603910352422779e-05}, "score": 4.954953568506194}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9845114605356664, "4": 0.014714983773729902, "3": 0.00068667565165493, "1": 8.016600586249662e-05, "2": 3.4960423024536967e-06}, "score": 4.983580459934675}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9658041293279629, "4": 0.032313919413104464, "3": 0.0016863699817016682, "1": 0.00018863794782965498, "2": 4.414716230175272e-06}, "score": 4.963545452504033}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9883127981725442, "4": 0.010692183697680846, "3": 0.0006467918699441194, "1": 0.000340058804805098, "2": 4.4519649386390054e-06}, "score": 4.986640591811645}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9950091827217994, "4": 0.004833970980138998, "3": 0.00013161481097540532, "1": 2.364634501003211e-05, "2": 0}, "score": 4.994808205788138}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9927529692906786, "4": 0.006017454196811977, "1": 0.0010465774606924895, "3": 0.0001786594639655233, "2": 2.2595621553957084e-06}, "score": 4.989432116364552}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9972446961366097, "4": 0.00262787169986142, "3": 8.449890350141118e-05, "1": 4.2010456768096334e-05, "2": 0}, "score": 4.997035085930031}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9972923532059502, "4": 0.00258434445222768, "3": 7.055747020586209e-05, "1": 5.220585002033011e-05, "2": 0}, "score": 4.997065715625636}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971332666500644, "4": 0.002568336155620312, "1": 0.00022092174813169636, "3": 7.58333794583186e-05, "2": 0}, "score": 4.996396304175427}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982179950596054, "4": 0.0017210701524062138, "1": 3.364042799971715e-05, "3": 2.5899911661953113e-05, "2": 0}, "score": 4.998092565652453}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9857674018195515, "4": 0.01330675071459302, "3": 0.0007401468096678483, "1": 0.00017701492622342985, "2": 0}, "score": 4.984504761373719}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9810199168730349, "4": 0.017901710715566083, "3": 0.0009635669367758687, "1": 0.00010983756119513584, "2": 3.313866246212357e-06}, "score": 4.979721830026313}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9840356607371729, "4": 0.01452913986980071, "3": 0.0011900455443833804, "1": 0.00023292687380246382, "2": 6.0486890218840535e-06}, "score": 4.982140805139946}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9934500606829468, "4": 0.006105341104544768, "3": 0.0003747726434469049, "1": 6.533948720005911e-05, "2": 0}, "score": 4.992883723735563}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.977212803943187, "4": 0.020122191866443994, "3": 0.002000607489086454, "1": 0.0006430185403535313, "2": 1.668490732777859e-05}, "score": 4.973254338747814}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.977722051754501, "4": 0.02049396144271917, "3": 0.0015205745836418226, "1": 0.000248312630212491, "2": 7.125939363560746e-06}, "score": 4.97545006529848}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9948485788148923, "4": 0.005025974065206978, "3": 9.859771214721388e-05, "1": 2.5634460458875858e-05, "2": 0}, "score": 4.994674286198201}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9808877666954849, "4": 0.017697483936268465, "3": 0.0013216200292608688, "1": 8.975875379785544e-05, "2": 2.3810642651514544e-06}, "score": 4.979293077307289}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9942479229088642, "4": 0.005585853712726358, "3": 0.00014202186973547818, "1": 2.1230239523499754e-05, "2": 0}, "score": 4.994045163896288}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9927250157461291, "4": 0.006920660956282957, "3": 0.00028761838746472763, "1": 6.297769133982747e-05, "2": 0}, "score": 4.992252162625544}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9385519595721102, "4": 0.05351103417951261, "3": 0.007595111213901023, "1": 0.00032583155910165495, "2": 1.0929401662007712e-05}, "score": 4.929962269372422}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9727357076035215, "4": 0.025929548288595002, "3": 0.0012622029646766832, "1": 6.673419952102239e-05, "2": 0}, "score": 4.971278942202403}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9958720823709692, "4": 0.004008552802238928, "3": 0.00011000321118577495, "1": 8.147222388726837e-06, "2": 0}, "score": 4.995738846711119}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9848789261295642, "4": 0.014747480859041104, "3": 0.00028221707885034555, "1": 8.6454352506998e-05, "2": 0}, "score": 4.984342190512067}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9887125823544184, "4": 0.01098237021083765, "3": 0.0002578648364627669, "1": 4.584676123654918e-05, "2": 0}, "score": 4.9883184974667065}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9130997857500974, "4": 0.07435758453857652, "3": 0.012446970736680553, "1": 7.775279958726029e-05, "2": 1.3536104973446137e-05}, "score": 4.900396419200164}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9970911887134849, "4": 0.002578511460099768, "3": 0.0002717030000007991, "1": 5.758646502960307e-05, "2": 0}, "score": 4.996647733292779}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9462327852484328, "4": 0.050285852694283664, "3": 0.0033555955940736994, "1": 0.00011874906366582233, "2": 3.4998235675882317e-06}, "score": 4.942517258192291}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9944494714229976, "4": 0.0046136452857654, "1": 0.00047755367308208424, "3": 0.00045547214304772775, "2": 2.461056078351642e-06}, "score": 4.992557802175148}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982499529213396, "4": 0.0017214959978368272, "3": 1.6551530219874928e-05, "1": 1.164483294934092e-05, "2": 0}, "score": 4.998198820971017}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9779093239922858, "4": 0.021192774094583706, "3": 0.0008804618135677437, "1": 1.6726588146761063e-05, "2": 6.323675787019571e-07}, "score": 4.976977496954823}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.982887086164285, "4": 0.016926351687583076, "3": 0.0001515617386780837, "1": 3.3858211604670194e-05, "2": 0}, "score": 4.982635072154459}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8738847036929461, "4": 0.12072616466655801, "3": 0.005287500182999009, "1": 9.86968033092697e-05, "2": 2.417276656571391e-06}, "score": 4.868296727783922}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972834666725712, "4": 0.0026517393388692345, "3": 5.989772700841496e-05, "1": 4.665567875458308e-06, "2": 0}, "score": 4.997209802291931}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9941078313160764, "4": 0.00576015842679888, "3": 9.909099386712777e-05, "1": 3.218358557949567e-05, "2": 0}, "score": 4.99391292076502}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"5": 0.991733277835329, "4": 0.007945965209228155, "3": 0.0002704138485649094, "1": 4.7127634935903053e-05, "2": 0}, "score": 4.9913246686586135}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9672542901516293, "4": 0.0278200582130448, "3": 0.004427416712013902, "1": 0.0004801084221932574, "2": 1.3223090186319072e-05}, "score": 4.961364815959411}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9994885626686809, "4": 0.00045411880914812686, "1": 3.86791446932833e-05, "3": 1.8210649457113963e-05, "2": 0}, "score": 4.999354743036526}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9931123880789864, "4": 0.006371387596976018, "3": 0.0003518146793937268, "1": 0.00016159764257656344, "2": 0}, "score": 4.992278570761256}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9754621268686748, "4": 0.023430330985352625, "3": 0.0008140908409253153, "1": 0.0002846793781266717, "2": 0}, "score": 4.973802540018085}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9922523546308591, "4": 0.0071274795952614625, "3": 0.0003148277166594281, "1": 0.00029915387046609913, "2": 0}, "score": 4.991046194117547}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9886524536497395, "4": 0.009824107156624299, "3": 0.0013348204373954606, "1": 0.00018617341125776028, "2": 1.3719259533205337e-06}, "score": 4.986757428330866}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.992175736159976, "4": 0.00722448520084804, "3": 0.0004509021068519619, "1": 0.00014622909825215958, "2": 0}, "score": 4.991288771130036}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9853683917052936, "4": 0.013646334884985319, "1": 0.0006249161982611076, "3": 0.00035179307863556213, "2": 0}, "score": 4.9831502698613725}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9739286623133565, "4": 0.023193435336131784, "3": 0.0025562695251547148, "1": 0.00031607817049036344, "2": 3.166381831559577e-06}, "score": 4.970420143141328}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9630251088035349, "4": 0.03524228637186165, "3": 0.001486794230545016, "1": 0.0002383589088107966, "2": 0}, "score": 4.960830397652257}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9871566350640548, "4": 0.012104899390825652, "3": 0.0006472836186060994, "1": 8.885079995245819e-05, "2": 1.137136838447333e-06}, "score": 4.98624170233437}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9844615539611651, "4": 0.0150616229019901, "3": 0.0003881564802620439, "1": 8.412380290971528e-05, "2": 0}, "score": 4.98382549544744}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9909669454015566, "4": 0.008690155028417851, "1": 0.00018476404118916435, "3": 0.00015339550069535832, "2": 0}, "score": 4.990263951656291}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9825767060211945, "4": 0.01609770763577888, "1": 0.0007235755459482734, "3": 0.0005889711834751127, "2": 0}, "score": 4.979829784801666}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9735877427538244, "4": 0.02439575834778807, "3": 0.0018311988817339606, "1": 0.0001714594092722226, "2": 8.197584666083032e-06}, "score": 4.971231251154954}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9921084957123784, "4": 0.007633233773103346, "3": 0.00023956878017097126, "1": 1.7239349938899352e-05, "2": 0}, "score": 4.991818659302535}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9932723085337112, "4": 0.0064980230142362705, "3": 0.00020628331882054898, "1": 2.1788963016954503e-05, "2": 0}, "score": 4.993002243326445}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9928434509338891, "4": 0.007014505918875809, "3": 0.00011279607676018333, "1": 2.680296613212055e-05, "2": 0}, "score": 4.9926526721054385}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9957526874535985, "4": 0.004180164830871895, "3": 5.7696791072011714e-05, "1": 7.654039578636014e-06, "2": 0}, "score": 4.995673817655018}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9947441760294536, "4": 0.004960100382712475, "3": 0.00021874738217459705, "1": 7.250282727264015e-05, "2": 0}, "score": 4.9943123681009185}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9339974228671325, "4": 0.05923701968584066, "3": 0.005814066726762369, "1": 0.0009238455074790645, "2": 2.5031037578095347e-05}, "score": 4.925364176606866}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9847553345343211, "4": 0.012954798745224524, "3": 0.0017954754813547147, "1": 0.0004815287592774542, "2": 1.1021154452185174e-05}, "score": 4.981495037717943}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9985554529639461, "4": 0.0013476121910267387, "1": 5.0076886681892e-05, "3": 4.599540765710842e-05, "2": 0}, "score": 4.998360088032424}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9953642058183855, "4": 0.003896158154324375, "3": 0.00048771253173358236, "1": 0.0002477059997305225, "2": 3.5618196715355893e-06}, "score": 4.994126903473422}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9044824747105533, "4": 0.088210347875474, "3": 0.006387474599852157, "1": 0.0008910589242179991, "2": 2.3251637460552776e-05}, "score": 4.895380148178917}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9236258902579292, "4": 0.07133304462140978, "3": 0.003925604212911352, "1": 0.0010998791157383553, "2": 1.1624646680825518e-05}, "score": 4.916381025657337}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9555163604994431, "4": 0.04134459001707478, "3": 0.003028891403019063, "1": 0.00010411130403564108, "2": 3.3444543558729602e-06}, "score": 4.952171019348366}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9186540089205419, "4": 0.0778907870084523, "3": 0.0029575900930676542, "1": 0.00048417264998994603, "2": 9.187717685923974e-06}, "score": 4.914229414217752}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9598044338620019, "4": 0.03818200681967501, "3": 0.001526996263047167, "1": 0.0004732399520034394, "2": 0}, "score": 4.956870466226984}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9892582570238594, "4": 0.00981775988750993, "3": 0.0008091760906543473, "1": 0.00011262115302498163, "2": 0}, "score": 4.988113377336767}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9980740515235045, "4": 0.00183396498037553, "3": 5.304250418819033e-05, "1": 3.669413958452573e-05, "2": 0}, "score": 4.997913168764108}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9908899215253907, "4": 0.00861349172310104, "3": 0.00043976282960606685, "1": 5.5226370075138024e-05, "2": 0}, "score": 4.990286061618867}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992089078085545, "4": 0.000772696200662554, "3": 1.0494722984895116e-05, "1": 6.232880328406262e-06, "2": 0}, "score": 4.999181381466281}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9963202545179423, "4": 0.003543533095430981, "3": 7.142918633103213e-05, "1": 6.1015294238253944e-05, "2": 0}, "score": 4.996069532545321}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9262524845502494, "4": 0.06955352353486373, "3": 0.0035181429486258703, "1": 0.0006330032509824703, "2": 0}, "score": 4.920874787387623}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9869789391732264, "4": 0.01229792167983206, "3": 0.0005665357911821913, "1": 0.00014282592170322296, "2": 0}, "score": 4.98599751013261}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9885792842120816, "4": 0.010323669607613226, "3": 0.0009680811902303835, "1": 0.00012204289215232192, "2": 3.185908711181747e-06}, "score": 4.987242391052343}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.990853281075322, "4": 0.00868979091855032, "3": 0.00028511241980972823, "1": 0.00016686107132645822, "2": 0}, "score": 4.990072490770531}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9871128418185258, "4": 0.012056745296720172, "3": 0.0005773610792024688, "1": 0.00024026429773028323, "2": 0}, "score": 4.985827294120367}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9944732887730497, "4": 0.0053999995972243186, "3": 7.29687712091731e-05, "1": 5.2431972001729206e-05, "2": 0}, "score": 4.9942443274273165}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9784270488379053, "4": 0.020740437124595317, "3": 0.0006946072361403688, "1": 0.00013658860951397633, "2": 0}, "score": 4.977323964073703}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.985183002230699, "4": 0.013858410144346175, "3": 0.0009036187710124851, "1": 5.4349942628010266e-05, "2": 4.359113238274124e-07}, "score": 4.984115641902307}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984591883709961, "4": 0.001516342642226829, "3": 1.577497080897314e-05, "1": 8.537041830857007e-06, "2": 0}, "score": 4.998417959000492}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970064655862025, "4": 0.0029494711378713293, "3": 3.699029415008507e-05, "1": 6.626783597908527e-06, "2": 0}, "score": 4.99695003977855}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9678455308570435, "4": 0.029077994314463635, "3": 0.00286329849151484, "1": 0.0002049878190212103, "2": 5.106905063278227e-06}, "score": 4.964360026882632}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9936497581534132, "4": 0.0061930969647224264, "3": 0.0001335514180959581, "1": 2.0483169684860364e-05, "2": 0}, "score": 4.993457847172326}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9627029325794894, "4": 0.02955897673629845, "3": 0.007241098916902487, "1": 0.0004691562919199084, "2": 1.9229942278618374e-05}, "score": 4.954024114788378}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9792538841403484, "4": 0.019368785569351663, "3": 0.0012451136102698416, "1": 0.0001295402388991194, "2": 1.4652942242419365e-06}, "score": 4.9776184032644375}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9505044484014067, "4": 0.04285523804438509, "3": 0.0054607594799867855, "1": 0.0011435080554157676, "2": 3.3554418642987096e-05}, "score": 4.941548401880039}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9522164181850631, "4": 0.04128929143186392, "3": 0.0050065561272670065, "1": 0.001421606086058668, "2": 4.417718847304009e-05}, "score": 4.942877386506528}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9959342785163741, "4": 0.003977182599224719, "3": 5.662539491324806e-05, "1": 3.156520978625412e-05, "2": 0}, "score": 4.995783304303215}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9956034303344594, "4": 0.004220737935454867, "3": 0.00013559649918649328, "1": 3.977344815854908e-05, "2": 0}, "score": 4.9953489731257745}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9929861228593729, "4": 0.006807883500533713, "3": 0.00015259258978870844, "1": 5.1672853072186305e-05, "2": 0}, "score": 4.992680227257589}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970266076133792, "4": 0.002888902808446727, "1": 4.3775730163999955e-05, "3": 3.914820444707649e-05, "2": 0}, "score": 4.996857692942271}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9536829474216324, "4": 0.03688221951601817, "3": 0.007047290938844325, "1": 0.002312131852893307, "2": 5.693752180388374e-05}, "score": 4.939602742925949}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.984791170432975, "4": 0.014285553458753273, "3": 0.000816645877124402, "1": 0.00010138301355718543, "2": 2.5713512989070035e-06}, "score": 4.983667864976264}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9133009911908752, "4": 0.07497046822413561, "3": 0.01109014392273815, "1": 0.0005849372391453076, "2": 4.1469680006521746e-05}, "score": 4.900383891562239}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.969970724371961, "4": 0.027143713673031804, "3": 0.0023869783538880817, "1": 0.0004834899641289496, "2": 9.238971389408185e-06}, "score": 4.966120454495098}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9794140689018609, "4": 0.019529697953182743, "3": 0.0009861047220753956, "1": 6.205329161106564e-05, "2": 0}, "score": 4.978249703799725}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"5": 0.993324534575427, "4": 0.00599996285863945, "3": 0.0005328966793300796, "1": 0.0001377650307130149, "2": 0}, "score": 4.99238314678776}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9955476594866963, "4": 0.004272509155868481, "3": 0.0001451377886803927, "1": 3.0739994462307056e-05, "2": 0}, "score": 4.9953142367634085}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984566927253736, "4": 0.0014863522723206207, "3": 3.6759936055182325e-05, "1": 1.4545178410313037e-05, "2": 0}, "score": 4.998381938000059}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978191662808944, "4": 0.002086901184740747, "3": 7.003391032503631e-05, "1": 2.199012651757728e-05, "2": 0}, "score": 4.997685066070493}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9939225468853645, "4": 0.005691109833724163, "3": 0.00031190621758589763, "1": 6.426219800440216e-05, "2": 0}, "score": 4.993427962069486}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9031059060453062, "4": 0.08283775029950009, "3": 0.013258187405314715, "1": 0.0007346943467536096, "2": 5.657722720044556e-05}, "score": 4.887536591547135}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8832465400894276, "4": 0.10512139014191413, "3": 0.011590200759435957, "1": 3.4170324337612086e-05, "2": 5.7553597896200626e-06}, "score": 4.871544011330749}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9354324436865846, "4": 0.05788820085835096, "3": 0.00626741681786472, "1": 0.00034637436086290427, "2": 3.483524138934848e-05}, "score": 4.928084752452144}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9297632361797424, "4": 0.06514801786819802, "3": 0.004715603855222916, "1": 0.0003368822820701089, "2": 2.1623843204730983e-05}, "score": 4.924007261535903}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.948409312186994, "4": 0.04851366830602122, "3": 0.0025912963687976308, "1": 0.0004727972066455155, "2": 1.0364749295205271e-05}, "score": 4.944381313432324}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8668266625885774, "4": 0.11900473461278706, "3": 0.013752055158029271, "1": 0.00036542057772244403, "2": 4.261386023402658e-05}, "score": 4.851900370377402}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9877914238347598, "4": 0.011617523200230387, "3": 0.000456067971158521, "1": 0.00013268933355499324, "2": 1.2838373951592618e-06}, "score": 4.986935718792308}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7863362178000327, "4": 0.15988694615971294, "3": 0.05227177649185739, "1": 0.0011740338792833318, "2": 0.0002653786191932331}, "score": 4.730059508684951}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9890093731528876, "4": 0.010492394684751412, "3": 0.00037611169406652836, "1": 0.00011721086269563755, "2": 0}, "score": 4.988286480967575}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9157874662263925, "4": 0.0772863363756914, "3": 0.0066513229782725, "1": 0.0002537685314322452, "2": 1.7248420222242584e-05}, "score": 4.908343844720682}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9442237194233325, "4": 0.05016511069443993, "3": 0.004617573168980846, "1": 0.0009629840587899455, "2": 2.6673366493729814e-05}, "score": 4.936667537148149}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8534599434091127, "4": 0.13313451112501362, "3": 0.011124771393943226, "1": 0.002196737442508537, "2": 7.739232054932301e-05}, "score": 4.835595727002646}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7570665852755581, "4": 0.19586453630517503, "3": 0.04515228460802837, "1": 0.001768292300667642, "2": 0.00013997118191610983}, "score": 4.706335365407429}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9868248610881853, "4": 0.012293946404390873, "3": 0.0007170000841504614, "1": 0.00016028036418804163, "2": 2.1819949171534283e-06}, "score": 4.985624361115026}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9261965461468865, "4": 0.0692100289386702, "3": 0.004180583286314811, "1": 0.0003932448940853275, "2": 1.6222522556608463e-05}, "score": 4.920806890130388}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9201133812899382, "1": 0.040132556149849646, "4": 0.03665209463115751, "3": 0.00298955120950729, "2": 0.00010933871684767724}, "score": 4.796509935856919}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9783379328687876, "4": 0.019720323998468424, "3": 0.001457842027545564, "1": 0.0004786975402378731, "2": 4.109619963636055e-06}, "score": 4.975436846054858}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9524708244015117, "4": 0.03882474414205033, "3": 0.008360588998510792, "1": 0.00029477712371459063, "2": 3.622634287685637e-05}, "score": 4.943165560640565}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951799847361096, "4": 0.00451801066672291, "3": 0.0002472887192812419, "1": 5.263959314423352e-05, "2": 0}, "score": 4.994776842677377}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9941083010321377, "4": 0.005429304163135496, "3": 0.00029189833036719233, "1": 0.00016832128401969836, "2": 0}, "score": 4.993313599495856}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9671752203454318, "4": 0.03161760478721284, "1": 0.0006257532086367096, "3": 0.0005558028016035937, "2": 0}, "score": 4.964766874142617}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9886126068156139, "4": 0.010678415690929581, "1": 0.0004192671297565907, "3": 0.0002830412248731948, "2": 0}, "score": 4.987078347164001}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9877636272813037, "4": 0.011611126030394004, "3": 0.00046825646968641006, "1": 0.00015247727338592087, "2": 0}, "score": 4.986842392557127}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9939506887097906, "4": 0.005766545949375107, "1": 0.00013785750206929366, "3": 0.00012199920861675099, "2": 0}, "score": 4.993437875295826}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9746270714237578, "4": 0.024455361569623316, "1": 0.0005632828827355095, "3": 0.0003500676977645657, "2": 2.035312883057431e-06}, "score": 4.9725852057704865}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9228863298393617, "4": 0.06712388748974671, "3": 0.009150827194595076, "1": 0.0007967890454249916, "2": 3.965133265427252e-05}, "score": 4.911268124772018}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9979059424042904, "4": 0.0020410477500687483, "3": 3.924812050913363e-05, "1": 1.2721195736864023e-05, "2": 0}, "score": 4.9978295689675685}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.979063241968724, "4": 0.019469160074491114, "3": 0.001379082301411627, "1": 8.524270647552006e-05, "2": 1.791652821828587e-06}, "score": 4.97742629609998}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9181767901871016, "4": 0.07628984062120162, "3": 0.005128341327776555, "1": 0.00037403757413293095, "2": 1.8723746001796043e-05}, "score": 4.911900074507115}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9917134622106734, "4": 0.00794889781142219, "3": 0.00028918642749145617, "1": 4.1987777245463746e-05, "2": 0}, "score": 4.991304722002917}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9232173500713997, "4": 0.07292779769209147, "3": 0.0034005843312305242, "1": 0.0004271347588622291, "2": 1.5435862840772854e-05}, "score": 4.918515233871059}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945639586381028, "4": 0.00514488634664188, "3": 0.000255015813755814, "1": 3.4504458858591837e-05, "2": 7.376325766050526e-07}, "score": 4.994204846093792}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962584839792951, "4": 0.0035958387675071256, "3": 7.840640010087884e-05, "1": 5.8232147102854624e-05, "2": 0}, "score": 4.996014383819067}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.984977916852947, "4": 0.012942312454027355, "3": 0.0015323032245450866, "1": 0.0005371411225156626, "2": 7.819585577624746e-06}, "score": 4.98182101227972}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970395254728991, "4": 0.002772607682497076, "3": 0.00014418923343691384, "1": 4.2642378444801026e-05, "2": 0}, "score": 4.996768440991434}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8954827774451845, "4": 0.09528160585646805, "3": 0.008827512624761722, "1": 0.0003799077871828965, "2": 2.289243617498684e-05}, "score": 4.885474453010403}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9943666062078813, "4": 0.005357238188675453, "3": 0.00024407255995843025, "1": 2.979982610120426e-05, "2": 0}, "score": 4.994035403768533}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9775201544226299, "4": 0.02107134960128976, "3": 0.001178308904735407, "1": 0.0002199161985193299, "2": 5.416170727761746e-06}, "score": 4.975676001197211}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.975405062052548, "4": 0.023855587794777162, "3": 0.0006154652943736199, "1": 0.0001139163671833704, "2": 0}, "score": 4.974457561528171}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9901601928340453, "4": 0.009179701419386385, "3": 0.0005865028679162031, "1": 6.625113242741695e-05, "2": 0}, "score": 4.989382210255775}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9747924163107622, "4": 0.023418218293206554, "3": 0.001705315229497614, "1": 7.66663628916396e-05, "2": 3.4164074917443783e-06}, "score": 4.972854128875332}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9966692221885725, "4": 0.0032406423910110345, "3": 7.332734226527264e-05, "1": 1.5182137281877436e-05, "2": 0}, "score": 4.996551968769036}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993790159904288, "4": 0.0006088934892800688, "3": 8.348513991742076e-06, "1": 3.0638783802610856e-06, "2": 0}, "score": 4.999362153536674}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995158210124949, "4": 0.000469155822763851, "3": 1.1257488571061779e-05, "1": 3.4725269547535687e-06, "2": 0}, "score": 4.99949443894407}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9966188914643846, "4": 0.00330597447640093, "3": 5.997594456801806e-05, "1": 1.3932783076482325e-05, "2": 0}, "score": 4.996518338235968}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8079538729692196, "4": 0.16347653757703184, "3": 0.026158761415926747, "1": 0.00223048439412927, "2": 0.00017772289328676897}, "score": 4.774750243011345}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9965317572961584, "4": 0.0033603820705448554, "1": 7.18795324975164e-05, "3": 3.568653896812347e-05, "2": 0}, "score": 4.996280725625971}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9950684342977122, "4": 0.004537010336660281, "3": 0.00022264254718240242, "1": 0.0001705019200523508, "2": 7.112726547443425e-07}, "score": 4.994333559106413}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991440539310052, "4": 0.0008462307342699091, "3": 6.8357251484974716e-06, "1": 1.9395181345385403e-06, "2": 0}, "score": 4.999132338927215}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9953534563411535, "4": 0.004498856615209746, "3": 0.0001246889901342657, "1": 2.220835474542773e-05, "2": 3.750314304330895e-07}, "score": 4.995161804885007}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7922081706299959, "4": 0.17776157373238985, "3": 0.028922078893236586, "1": 0.0009080573686738253, "2": 0.0001945420933634033}, "score": 4.760177075166188}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9672729099759301, "4": 0.028518553600274433, "3": 0.0036902908606934012, "1": 0.00049652451503405, "2": 1.3860132560480806e-05}, "score": 4.962072888078699}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8900107479326941, "4": 0.09414250820629343, "3": 0.015598695344294058, "1": 0.00021154623038144462, "2": 3.1638715918708286e-05}, "score": 4.873718385856314}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9878832136783526, "4": 0.011743997734699793, "3": 0.00032289834682082625, "1": 4.3634606298399726e-05, "2": 0}, "score": 4.987435588548107}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921327798492281, "4": 0.0068148378992041484, "1": 0.0005647971035917312, "3": 0.00048372678714576667, "2": 2.5424128166875586e-06}, "score": 4.989950879649567}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8377135857799677, "4": 0.14524193641591346, "3": 0.014739038868673717, "1": 0.002209607016174451, "2": 8.491549266191655e-05}, "score": 4.816184804698968}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8822518407519272, "4": 0.10660856749316022, "3": 0.010279815156520456, "1": 0.0008044805245230991, "2": 4.576225194586108e-05}, "score": 4.86947534894109}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9743098809630889, "4": 0.02419712631946598, "3": 0.0012917737565304491, "1": 0.00019296610620494863, "2": 4.38565750172355e-06}, "score": 4.972434198167756}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972348513855631, "4": 0.0026547377634367794, "3": 6.969625304250506e-05, "1": 3.826495858590437e-05, "2": 0}, "score": 4.9970528026765635}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9882871883548203, "4": 0.011069795564023556, "3": 0.0004644377610355847, "1": 0.00017201497861010892, "2": 0}, "score": 4.98731318573157}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8690581065124384, "4": 0.10984387934516678, "3": 0.019405689164536874, "1": 0.001452593063549721, "2": 0.00023244126232867062}, "score": 4.844835915037231}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7741911051423331, "4": 0.20112161583276789, "3": 0.02092070794028909, "1": 0.0035570611311835677, "2": 0.00013979115487723262}, "score": 4.742371388740039}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9731202817116025, "4": 0.02539839743648165, "3": 0.00138792090970719, "1": 8.474176369213265e-05, "2": 0}, "score": 4.971486546814768}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9261722143570342, "4": 0.07084268248300923, "3": 0.002446109440688429, "1": 0.0005237385230495009, "2": 8.356122953344328e-06}, "score": 4.922144539044027}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9423090543869312, "4": 0.05406456491823903, "3": 0.003171895247094377, "1": 0.00042755458223281027, "2": 1.9361848505845385e-05}, "score": 4.937822870093371}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9602129079452221, "4": 0.03619477527452202, "3": 0.002588082564581928, "1": 0.000985438340545606, "2": 1.2125680487926013e-05}, "score": 4.954650626703521}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9704759147919366, "4": 0.02697139281613202, "3": 0.0019059732661552296, "1": 0.0006337911970275179, "2": 7.831441228162512e-06}, "score": 4.966657831611818}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.99502605623059, "4": 0.004559886254297312, "3": 0.00037163736663933317, "1": 4.012259162990813e-05, "2": 0}, "score": 4.9945363360928265}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9946318877864957, "4": 0.005041919077640531, "1": 0.00021158494688405634, "3": 0.00011285203749137045, "2": 0}, "score": 4.993886026322777}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9925060660006728, "4": 0.007002178248329314, "3": 0.00036561123081378774, "1": 0.00012139031015846948, "2": 0}, "score": 4.991780998974552}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9916449976683447, "4": 0.008141933471186599, "3": 0.0001846967993169348, "1": 2.6415595066599898e-05, "2": 0}, "score": 4.991382993691033}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.963042906635031, "4": 0.03621873690482762, "3": 0.0006026692615622243, "1": 0.0001299697275013855, "2": 0}, "score": 4.96205582871734}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9770778162045415, "4": 0.02213920411897981, "3": 0.0006356725409097945, "1": 0.00014376378316447212, "2": 0}, "score": 4.976014310676792}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967595795318634, "4": 0.0031861349856962587, "3": 3.1358396368440836e-05, "1": 2.2656154977832435e-05, "2": 0}, "score": 4.996660522696887}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.971571122392217, "4": 0.02646629082671333, "3": 0.0015026350681319055, "1": 0.0004545896109384482, "2": 3.4220252629886496e-06}, "score": 4.968699753792601}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9668245378431216, "4": 0.030824029950409386, "3": 0.0020360594119451254, "1": 0.0002976590065385659, "2": 1.143535140854723e-05}, "score": 4.963878682359918}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9959601761321247, "4": 0.0038701318606558905, "3": 0.00014887314358332098, "1": 1.963539015003612e-05, "2": 0}, "score": 4.995753575266045}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9187329972691959, "4": 0.06702285488982661, "3": 0.013607692787743595, "1": 0.0005706259167754441, "2": 4.610682828268208e-05}, "score": 4.903339029005279}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967548379578215, "4": 0.0031620911940111562, "3": 5.2000147648117626e-05, "1": 3.0117926460958545e-05, "2": 0}, "score": 4.996613433578217}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9899670353837998, "4": 0.009791942748420903, "3": 0.00020860751294722978, "1": 2.9034842025067256e-05, "2": 0}, "score": 4.989674667962992}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9615364261110787, "4": 0.034707027184867976, "3": 0.003116770217609942, "1": 0.0006276561960031232, "2": 9.398805041630093e-06}, "score": 4.956520492851931}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9668206357471614, "4": 0.030729161169714227, "3": 0.0016469359787089177, "1": 0.0007872463770705632, "2": 9.113142095107242e-06}, "score": 4.962800384978788}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9632575591107918, "4": 0.03412769002542295, "3": 0.0021567506901764718, "1": 0.00044467734775801047, "2": 6.945823599140027e-06}, "score": 4.959759005115479}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979880936023555, "4": 0.0019493985302721875, "1": 3.632980787770115e-05, "3": 2.5310784202185854e-05, "2": 0}, "score": 4.997854658809211}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9949425028237595, "4": 0.00450012187157665, "3": 0.00029749623158499794, "1": 0.0002561513697860392, "2": 0}, "score": 4.993880257373523}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9958865106702169, "4": 0.003957175760305814, "3": 0.00012224149531557646, "1": 3.272634980869499e-05, "2": 0}, "score": 4.995667430019383}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9923879442635485, "4": 0.007249041686678825, "3": 0.0002367570613866776, "1": 0.00012119484721022009, "2": 0}, "score": 4.991792623254807}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962060692105387, "4": 0.0033122965779025762, "3": 0.00029850944025106154, "1": 0.00018136916829983535, "2": 1.153792748532422e-06}, "score": 4.995361743698801}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971266250666341, "4": 0.0026178262006616177, "1": 0.00018101330882169009, "3": 7.216329650356204e-05, "2": 0}, "score": 4.9965137857013}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975270464999899, "4": 0.0024018968491039835, "3": 5.104321148310233e-05, "1": 1.9314643870339256e-05, "2": 0}, "score": 4.997418756348687}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9771687433884007, "4": 0.02127267273851869, "3": 0.0008421650849952892, "1": 0.000697462645877728, "2": 0}, "score": 4.974252658437711}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9909787696896927, "4": 0.008745363541679948, "3": 0.0002021420277407421, "1": 7.13109261748794e-05, "2": 0}, "score": 4.990565085924004}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9881611077535101, "4": 0.011093391592314346, "3": 0.00046435556282663757, "1": 0.00027127472640790773, "2": 0}, "score": 4.986892669002261}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984555025657053, "4": 0.0015150527835510036, "3": 2.054697150298266e-05, "1": 7.905063930387458e-06, "2": 0}, "score": 4.998412231441678}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9847575295564082, "4": 0.014323080813235271, "3": 0.0007675748183975262, "1": 0.00013632729261754434, "2": 0}, "score": 4.983596206325426}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.986269465632844, "4": 0.012967539573482222, "3": 0.0006122929582723195, "1": 0.0001493716593070828, "2": 7.85655842358887e-07}, "score": 4.985208022850687}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9845353795321549, "4": 0.014327321072683422, "3": 0.0010188676657052996, "1": 0.00011588537522577906, "2": 1.7524004924361538e-06}, "score": 4.983166131528213}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9519635554632188, "4": 0.040722435403273534, "3": 0.005220230609491011, "1": 0.0020641907871500834, "2": 2.295609682214222e-05}, "score": 4.940511077429556}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9914816083634251, "4": 0.008040640779695131, "3": 0.00033012110037095385, "1": 0.0001449535806856044, "2": 0}, "score": 4.990719277859976}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9476050428539756, "4": 0.04704647199161183, "3": 0.0048344834082211, "1": 0.0005060277744327092, "2": 6.298424721748165e-06}, "score": 4.9412414563673455}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9999280483736425, "4": 7.062559102762086e-05, "3": 9.798856066531255e-07, "1": 2.0483378327245463e-07, "2": 0}, "score": 4.999926595292251}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.991898268372436, "4": 0.007807558312928734, "3": 0.00022474143372992365, "1": 6.863575150661907e-05, "2": 4.402962681143399e-07}, "score": 4.991467091888489}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.991101708231178, "4": 0.008661433837178682, "3": 0.00020274855337757533, "1": 3.3345424213787125e-05, "2": 0}, "score": 4.99079968033059}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9955408058615354, "4": 0.0043154356404272575, "3": 7.858466337684263e-05, "1": 6.462604855789982e-05, "2": 0}, "score": 4.99526888824695}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999708403221517, "4": 2.7944560295664122e-05, "1": 6.874594437876782e-07, "3": 1.170037326109315e-07, "2": 0}, "score": 4.999969071581764}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9221176504880233, "4": 0.07581977018188744, "3": 0.0019217385651123192, "1": 0.00013433793898839696, "2": 3.827736200072087e-06}, "score": 4.919787703148238}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9703483919606327, "4": 0.028223009331215267, "3": 0.0011682118880819803, "1": 0.0002520001185541464, "2": 4.799206337863836e-06}, "score": 4.968418055499316}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9822379975122517, "4": 0.01644812154638902, "3": 0.0010511305287336003, "1": 0.0002592973721166327, "2": 2.917801897471095e-06}, "score": 4.98040366401327}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948561286499195, "4": 0.005011289559001511, "1": 8.618262213331582e-05, "3": 4.190308944430856e-05, "2": 0}, "score": 4.994560149315576}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9908903862528728, "4": 0.008633644993181642, "3": 0.0003655727339780772, "1": 0.00010918498544847304, "2": 7.22667940768858e-07}, "score": 4.990196296805444}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9809399640649912, "4": 0.01816955296124998, "3": 0.0007841005447359415, "1": 0.00010219334497258467, "2": 2.2934920253060774e-06}, "score": 4.979846553890599}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9349125252055239, "4": 0.05821844791418538, "3": 0.00601704081190859, "1": 0.0007760590075614726, "2": 4.8220153591131e-05}, "score": 4.92649653741736}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9782880623854313, "4": 0.019886946843209307, "3": 0.0017555583930367246, "1": 6.684513713460924e-05, "2": 1.4679744977907378e-06}, "score": 4.9763301254057835}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9916460547624757, "4": 0.007679022642591798, "3": 0.0003987470906768697, "1": 0.00027018571556239025, "2": 0}, "score": 4.990442683067496}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9959641978274357, "4": 0.0037908852953554882, "3": 0.0002057530283345457, "1": 3.779102187819875e-05, "2": 0}, "score": 4.995646438583776}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6113451840432804, "4": 0.3294275591647947, "3": 0.02972202873065915, "1": 0.029405692527374603, "2": 9.226137282375389e-05}, "score": 4.493225142783982}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9253683634368391, "4": 0.0718525195691188, "3": 0.002512032732518234, "1": 0.0002625757358557671, "2": 3.9848296278446455e-06}, "score": 4.922061116717255}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9463677210402007, "4": 0.05253240824137581, "3": 0.0010584189933314973, "1": 3.979202669659013e-05, "2": 0}, "score": 4.9451914946995865}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9801958405366828, "4": 0.019460439844255165, "3": 0.0003349775645079385, "1": 7.96479780787339e-06, "2": 0}, "score": 4.9798377301642365}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9988108392127215, "4": 0.0011495393293911127, "1": 2.5104486067690796e-05, "3": 1.4239453934671851e-05, "2": 0}, "score": 4.99872156346368}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9957399303501875, "4": 0.003906583781757991, "3": 0.000214314927690272, "1": 0.00013793182729175728, "2": 6.645431665200295e-07}, "score": 4.995111062615159}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9846811251838358, "4": 0.014967625655156098, "3": 0.0002730873091971246, "1": 7.31117840270596e-05, "2": 0}, "score": 4.984193672767318}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9973918398752134, "4": 0.0024134324298574943, "3": 0.00016285505270189764, "1": 3.0313542442567263e-05, "2": 0}, "score": 4.997139598835318}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998834704001013, "4": 0.0001120389476773498, "3": 2.8328734728748825e-06, "1": 1.2736013014368385e-06, "2": 0}, "score": 4.999877200852995}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9861978147726812, "4": 0.012967319127183276, "3": 0.00067107564004906, "1": 0.00015996268318924943, "2": 2.594551211106045e-06}, "score": 4.9850428767608195}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9644795881517552, "4": 0.028641845531980313, "3": 0.006732529173860847, "1": 0.00014123632595812024, "2": 2.925807637525386e-06}, "score": 4.9573192933668535}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9220379829647077, "4": 0.06437301213057937, "3": 0.011746880065391397, "1": 0.0017531712292065513, "2": 8.350558851698006e-05}, "score": 4.9048695077832845}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9798795990278943, "4": 0.01859367332392557, "3": 0.0013343774840044705, "1": 0.00018235978164573763, "2": 3.795600215767746e-06}, "score": 4.97799660947462}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974041754942926, "4": 0.002373816456050168, "3": 0.00012690916038426406, "1": 9.436823831077517e-05, "2": 0}, "score": 4.996994890074252}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9639881509430364, "4": 0.030456473896060387, "3": 0.0047440574847564445, "1": 0.0007853838333517036, "2": 2.313539180854663e-05}, "score": 4.956844348856619}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8612777901043334, "4": 0.11314239735645357, "3": 0.02188012693562065, "1": 0.0035199763786691583, "2": 0.00017383464963761593}, "score": 4.8284949317892805}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9748912038551861, "4": 0.02290853340640267, "3": 0.0017026818706624169, "1": 0.0004868565679134622, "2": 7.890902849962676e-06}, "score": 4.971714923729219}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9815099379985196, "4": 0.01754829473303563, "3": 0.0007919692441878669, "1": 0.0001427629493581747, "2": 0}, "score": 4.980296576366094}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9927089172521706, "4": 0.006464394042992118, "3": 0.00043911026645216447, "1": 0.0003834006622676086, "2": 1.9740782054143125e-06}, "score": 4.9911178409668215}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9853840178011481, "4": 0.013816340404704742, "3": 0.0006912762715437669, "1": 0.0001007711957108577, "2": 0}, "score": 4.984397903781946}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9860274105691853, "4": 0.013050974156392925, "3": 0.000811116146637551, "1": 0.00010641468219734525, "2": 2.83231545176761e-06}, "score": 4.98489261895878}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9316865226151272, "4": 0.0613292063547177, "3": 0.005968396384332483, "1": 0.0009604967110189454, "2": 3.9124918193777806e-05}, "score": 4.922773384112489}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9826356329131598, "4": 0.016109759669481978, "3": 0.0010426382491397108, "1": 0.00020774130049066642, "2": 2.9948991492566125e-06}, "score": 4.980964990463258}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9959418471476825, "4": 0.003920917878149684, "1": 6.982848757583387e-05, "3": 6.554274714659136e-05, "2": 0}, "score": 4.995668674604792}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9775122961696947, "4": 0.01944232282898795, "3": 0.0016423863554237636, "1": 0.0013523270902007529, "2": 0}, "score": 4.971862170424314}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9596632224657159, "4": 0.0361417092390024, "3": 0.0035015533312928986, "1": 0.0006813689648020591, "2": 9.397902799654394e-06}, "score": 4.954101388396996}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9779293860078528, "4": 0.020285092952649762, "3": 0.0012959071851671518, "1": 0.0004797588385523504, "2": 5.845069924388465e-06}, "score": 4.975186422611932}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9593999154904618, "4": 0.03158566185896957, "3": 0.005654011419456047, "1": 0.003317204064856995, "2": 3.9418709262100875e-05}, "score": 4.943719029696869}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9878176036177856, "4": 0.011708505915395701, "3": 0.00025872573385122785, "1": 0.00020982808612782648, "2": 0}, "score": 4.986934660547289}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.996110832876521, "4": 0.003634869753001359, "3": 0.00015362438397697933, "1": 9.959446173400624e-05, "2": 0}, "score": 4.995659498950771}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9816258258287953, "4": 0.016336643937948488, "3": 0.0011723077933432384, "1": 0.0008306890673283014, "2": 1.2051300241378182e-05}, "score": 4.977959334785497}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9917217866884129, "4": 0.007289888704139427, "1": 0.0005892476525199046, "3": 0.00039579387496157446, "2": 1.6222296951459412e-06}, "score": 4.989556648901931}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9891591135834578, "4": 0.010394286487490969, "3": 0.0003457094069833719, "1": 9.739185256933943e-05, "2": 0}, "score": 4.988524687139938}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991106126395997, "4": 0.0007390612929965712, "1": 0.00013425225871823503, "3": 1.5025391820192442e-05, "2": 0}, "score": 4.998693877519129}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975086635426955, "4": 0.0023195965715455628, "1": 0.00011235702876091041, "3": 5.8843098727266446e-05, "2": 0}, "score": 4.99711328755783}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8984705411464731, "4": 0.08089604852934694, "3": 0.019296230751387047, "1": 0.0012263260875980972, "2": 8.841861796784231e-05}, "score": 4.875338132991149}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9930349080757733, "4": 0.006737502309258451, "3": 0.00017269819923395905, "1": 5.1716276504055035e-05, "2": 0}, "score": 4.99271021304017}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9390119204683315, "4": 0.0550773344746017, "3": 0.005482030047481006, "1": 0.00038888600638628957, "2": 2.5524902849828114e-05}, "score": 4.93232551867377}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9658700699242401, "4": 0.03192447250961119, "3": 0.0018227425801060919, "1": 0.00036225350542453197, "2": 0}, "score": 4.962980270830008}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9935281863825562, "4": 0.00605045380900249, "3": 0.0002547930273064513, "1": 0.00016429137988506677, "2": 1.1539554447797822e-06}, "score": 4.992779324652915}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"5": 0.941827897633611, "4": 0.048549042809521104, "3": 0.009017065774425093, "1": 0.0005572213501168884, "2": 3.772735989744234e-05}, "score": 4.931073996868771}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9835132755230958, "4": 0.014634209128968326, "3": 0.0013152187202459622, "1": 0.0005306114697118588, "2": 4.5094651657831975e-06}, "score": 4.980599336946311}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9821929148050373, "4": 0.015441703656896472, "3": 0.0021027337397530816, "1": 0.00023177372164184416, "2": 0}, "score": 4.979425098745951}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9806849214453137, "4": 0.018601770771977326, "3": 0.0005581374498612457, "1": 0.00014420942134271545, "2": 0}, "score": 4.979704894190071}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9974893258276853, "4": 0.0023903308300576042, "1": 7.167822875873633e-05, "3": 4.660121240017394e-05, "2": 0}, "score": 4.997229748112581}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9979996112498074, "4": 0.0018972154887297438, "3": 5.8734398362176e-05, "1": 4.324153786630392e-05, "2": 0}, "score": 4.997812346943749}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9918986195044851, "4": 0.007531635973583323, "3": 0.0003540196988180606, "1": 0.00021197440960258487, "2": 0}, "score": 4.990912392908085}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9986692186758465, "4": 0.0012269535138424862, "3": 6.423932473359648e-05, "1": 3.831036774909828e-05, "2": 0}, "score": 4.998491324437428}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9950037555585141, "4": 0.0047156760045138435, "3": 0.00014463922781544507, "1": 0.0001338664361825829, "2": 0}, "score": 4.994459568366472}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9978947864769563, "4": 0.001950041937943604, "1": 0.00010240039376550507, "3": 5.0794981379611224e-05, "2": 0}, "score": 4.997538761660311}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9902613032534402, "4": 0.008619100069902066, "3": 0.0010924023687241926, "1": 2.5718705251649693e-05, "2": 8.443354235783661e-07}, "score": 4.989090680478676}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9433343587494528, "4": 0.0551631952938506, "3": 0.0014362122684865074, "1": 6.223717922850094e-05, "2": 0}, "score": 4.94171519851653}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9924592144681735, "4": 0.007356735432558708, "3": 0.000116242736170952, "1": 6.54562223398281e-05, "2": 0}, "score": 4.992148935746783}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991555885861422, "4": 0.0008239848616562183, "3": 1.1344607920540087e-05, "1": 8.485616536372825e-06, "2": 0}, "score": 4.999119382931221}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982093306648331, "4": 0.0017615855408392445, "3": 2.0760134933516825e-05, "1": 7.188694315571912e-06, "2": 0}, "score": 4.998168137332931}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8913867792719162, "4": 0.10153811842669506, "3": 0.004816161680532442, "1": 0.0022184771210498433, "2": 3.362425084476699e-05}, "score": 4.879853955266794}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9869927441441935, "4": 0.012035556123084873, "3": 0.0007441034403997373, "1": 0.00022108175339225877, "2": 0}, "score": 4.985591816119872}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9939571684942419, "4": 0.005486028453030242, "3": 0.000334445540607162, "1": 0.0002205661297229963, "2": 0}, "score": 4.992962803340553}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9973667006314942, "4": 0.0022952865152860613, "3": 0.0001764249472625848, "1": 0.0001600630112411665, "2": 7.919354111783348e-07}, "score": 4.996709233326992}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9862550898738838, "4": 0.013324320561318095, "3": 0.0002648269405074547, "1": 0.00014983685336733354, "2": 0}, "score": 4.9855465924966165}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9585980600415457, "4": 0.03974342739924597, "3": 0.0013763489145420112, "1": 0.00027257915744695663, "2": 0}, "score": 4.956413140384183}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9941012344383963, "4": 0.005507269126516651, "3": 0.00024860009419149117, "1": 0.00014008838683879132, "2": 0}, "score": 4.993435158703973}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9979271952330391, "4": 0.0019994992595401004, "3": 5.1597775338558575e-05, "1": 2.0801218317824478e-05, "2": 0}, "score": 4.9978140983349615}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969738745757396, "4": 0.002825009363149562, "1": 0.0001233767346906813, "3": 7.583770208414138e-05, "2": 0}, "score": 4.996529801694907}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9876219817626035, "4": 0.011545356009137163, "3": 0.0005055164388764353, "1": 0.0003224482176650946, "2": 0}, "score": 4.986153753198711}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9949093408483694, "4": 0.004565433992057597, "1": 0.0003331595678574898, "3": 0.00018939893504700295, "2": 0}, "score": 4.993723113128117}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994673274584136, "4": 0.005144508211392046, "3": 0.00011749473898244056, "1": 6.384655062793981e-05, "2": 0}, "score": 4.994365111172447}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9803171492382833, "4": 0.01677392469195274, "3": 0.002105233271864007, "1": 0.0007948683933258873, "2": 6.732426025451276e-06}, "score": 4.9758158873202945}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999454145632731, "4": 0.0004937619695086205, "1": 4.3063361654381956e-05, "3": 8.02933377858357e-06, "2": 0}, "score": 4.999317925234445}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996130158676828, "4": 0.00035255292681146536, "1": 2.6796721768508383e-05, "3": 7.041108097270241e-06, "2": 0}, "score": 4.999526177688765}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9825139822915355, "4": 0.016833562796274303, "3": 0.0006126182946934572, "1": 3.682483780890089e-05, "2": 0}, "score": 4.98179384643018}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9914614462941818, "4": 0.008366116338088078, "3": 0.00011944781219682454, "1": 4.750654818018757e-05, "2": 0}, "score": 4.991204913621274}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9893885855445738, "4": 0.010093496231772062, "3": 0.0003646213281632037, "1": 0.00015060831976513195, "2": 0}, "score": 4.9885747971153185}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9947759057909998, "4": 0.004970867036822057, "3": 0.00013016691103563178, "1": 0.00012067591428767162, "2": 0}, "score": 4.994286081859993}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9949661062242201, "4": 0.004900320342412121, "3": 8.810114751192367e-05, "1": 4.178880822906482e-05, "2": 0}, "score": 4.994756302814606}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8867362690737736, "4": 0.10811201645165494, "3": 0.004795993486158129, "1": 0.00033885387185171286, "2": 1.3088769310432709e-05}, "score": 4.880900864782801}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9887729549878547, "4": 0.010724382409734796, "3": 0.0002694518089814884, "1": 0.00023118322038252125, "2": 0}, "score": 4.987811956378623}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9019786489381034, "4": 0.08643323610501778, "3": 0.008354344299721109, "1": 0.003193100789432342, "2": 3.769402364808608e-05}, "score": 4.883972244786357}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9862251742519602, "4": 0.013499921612987244, "3": 0.0001944449438528784, "1": 7.91215721814336e-05, "2": 0}, "score": 4.98579468320928}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9865623418834694, "4": 0.012972086789937151, "3": 0.0003097100564273608, "1": 0.00015339350656681127, "2": 0}, "score": 4.985794884016073}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9765512721517683, "4": 0.021359903130273108, "3": 0.0012407242466358364, "1": 0.0008323476132599847, "2": 0}, "score": 4.9728288298998296}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9750182307051208, "4": 0.022960167781519547, "3": 0.0011798198755445888, "1": 0.0008183612442163796, "2": 0}, "score": 4.971406077809612}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9576783624059713, "4": 0.03967940466818366, "3": 0.002152852439728513, "1": 0.00046599563072928437, "2": 1.3430759453445566e-05}, "score": 4.9541101588592005}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9859756070359262, "4": 0.01199136825627748, "3": 0.0011368220327405056, "1": 0.0008805010830403315, "2": 7.785877829088522e-06}, "score": 4.982189484729645}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.991068331956502, "4": 0.00834029242730636, "3": 0.0004003203325402488, "1": 0.0001865493019866313, "2": 0}, "score": 4.9901128251482385}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9731190400109152, "4": 0.0247327401727084, "3": 0.001840888395945067, "1": 0.00029878150625838057, "2": 7.732649489128906e-06}, "score": 4.970367134844006}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9931903464886728, "4": 0.006559086098397154, "3": 0.00019679184740338507, "1": 5.2915566480256736e-05, "2": 0}, "score": 4.992835661779551}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9831600993388979, "4": 0.015322382670004945, "3": 0.0012607628559426752, "1": 0.00024888863762358827, "2": 5.763146298549586e-06}, "score": 4.981143207966263}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9902291549420804, "4": 0.008912481223536632, "3": 0.0006548138245895191, "1": 0.00019966651662060422, "2": 2.7146704314347537e-06}, "score": 4.988971068158642}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9916109987108022, "4": 0.007687601828142439, "3": 0.00045382994526165757, "1": 0.0002446013048738408, "2": 1.8602456668671308e-06}, "score": 4.990420741711353}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9880372663182635, "4": 0.011189534020708944, "1": 0.0004315589242435875, "3": 0.00033617600861201604, "2": 0}, "score": 4.986411804009295}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.981893430921362, "4": 0.016658044934499013, "3": 0.0011550134385128576, "1": 0.0002894844429633934, "2": 2.990772029632793e-06}, "score": 4.979864997250927}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9871486233333163, "4": 0.01085431697769077, "1": 0.0010472690581725208, "3": 0.0009420573538973445, "2": 5.016680991465235e-06}, "score": 4.983057396012641}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9780568586092272, "4": 0.021154170630465697, "3": 0.0005285104393807316, "1": 0.00025683928984825106, "2": 0}, "score": 4.976761367183568}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.974628769225595, "4": 0.02356257808092707, "3": 0.001035150968103325, "1": 0.0007649615399321847, "2": 4.308503198056789e-06}, "score": 4.971294226839832}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9982120600723374, "4": 0.0016978254394492257, "3": 5.120778431873729e-05, "1": 3.774928586241875e-05, "2": 0}, "score": 4.998048759590063}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.997227265349179, "4": 0.0025135464369182934, "1": 0.0001641734610122506, "3": 9.251081512594972e-05, "2": 0}, "score": 4.996644729687393}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983303803682299, "4": 0.0015727473255631296, "3": 8.76337815699138e-05, "1": 8.386250822433819e-06, "2": 0}, "score": 4.998218438589628}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957913413316483, "4": 0.00400265935507854, "3": 0.00012029710501336606, "1": 8.352538168685658e-05, "2": 0}, "score": 4.995422634944017}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984052390847726, "4": 0.0015467916445664816, "1": 2.6937639808689844e-05, "3": 1.917019171834051e-05, "2": 0}, "score": 4.998307114261558}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9808539374406713, "4": 0.01846315046609691, "3": 0.0003698696173385041, "1": 0.00031084909146415697, "2": 1.2024541074229623e-06}, "score": 4.979550086306608}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9969253037899339, "4": 0.0028966699351888102, "1": 0.00010365971443810654, "3": 7.366034229493752e-05, "2": 0}, "score": 4.996541368079921}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9588269392277713, "4": 0.03685752776256479, "3": 0.003992901976651101, "1": 0.00029703843997836896, "2": 1.6844388219336154e-05}, "score": 4.9539175782210965}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9840075000075877, "4": 0.015489277014204514, "3": 0.00030772254773937276, "1": 0.00019350039580357846, "2": 0}, "score": 4.983121242549002}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9868855773555288, "4": 0.011995268483376974, "3": 0.0009600007425625839, "1": 0.00015011768572250069, "2": 0}, "score": 4.985484128127068}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9274882574610905, "4": 0.0675881707601983, "3": 0.004667447176093555, "1": 0.000231128898708778, "2": 0}, "score": 4.922150473389062}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.978869479073484, "4": 0.02041962767013001, "3": 0.0005880074147653507, "1": 0.0001155532610107456, "2": 0}, "score": 4.977941982714106}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9686708740988621, "4": 0.028909269249832382, "3": 0.002285222923216608, "1": 0.0001258712498526177, "2": 0}, "score": 4.966016502124663}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941449402646261, "4": 0.0057869123645950095, "3": 6.148046966558168e-05, "1": 5.757927252587917e-06, "2": 0}, "score": 4.9940670895942025}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997432875115196, "4": 0.0025384066447664156, "3": 2.07344083199961e-05, "1": 5.836110460789954e-06, "2": 0}, "score": 4.997396774505749}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8971998675159442, "4": 0.0981275221274701, "3": 0.004096675040558094, "1": 0.0005599957855875025, "2": 1.1444566294904037e-05}, "score": 4.891404322816503}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8861425807233368, "4": 0.1077864633806592, "3": 0.005612028715229133, "1": 0.00043196223177017817, "2": 1.8771815285031445e-05}, "score": 4.8792043251208295}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.964062598766598, "4": 0.03339082557884349, "3": 0.0020230581030057553, "1": 0.0005160305958281215, "2": 4.335298898721294e-06}, "score": 4.960485805399954}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9644909044571499, "4": 0.03438930376560833, "3": 0.0008567066471561839, "1": 0.0002561452222269354, "2": 3.2268955917634653e-06}, "score": 4.962862883473827}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975200491715589, "4": 0.002381975722896501, "1": 6.97872660257807e-05, "3": 2.706581677218958e-05, "2": 0}, "score": 4.997284740532873}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9591629643424743, "4": 0.037095422489997275, "3": 0.002941717748654371, "1": 0.000766143935900848, "2": 2.2283144885861606e-05}, "score": 4.953889188020052}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9849642656461081, "4": 0.014180195088054244, "3": 0.000610575868138208, "1": 0.0002399919924429364, "2": 2.3810118823138357e-06}, "score": 4.9836314997693965}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9675201378302332, "4": 0.030237814563739376, "3": 0.0020490909975478654, "1": 0.00018077742129907673, "2": 6.208141389327548e-06}, "score": 4.9649220598798145}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943829913169401, "4": 0.005506307641267265, "3": 8.813789335141125e-05, "1": 2.058843597968165e-05, "2": 0}, "score": 4.994235051443997}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9957985570610091, "4": 0.0039488416351554385, "3": 0.00016749082237354658, "1": 8.232176713618262e-05, "2": 0}, "score": 4.99538687678687}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"5": 0.931247658177737, "4": 0.06081926996567752, "3": 0.007330606678507566, "1": 0.0005848100876113898, "2": 1.4962477362954345e-05}, "score": 4.922135179234935}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8787873088765539, "4": 0.11767927070269604, "3": 0.0028231697512770427, "1": 0.0006961588436735643, "2": 7.784468712730338e-06}, "score": 4.87386560543925}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9454223973802881, "4": 0.052611718441090714, "3": 0.0017219164384932137, "1": 0.0002365821625513923, "2": 3.52495107933212e-06}, "score": 4.942987325073836}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9517656885093652, "4": 0.04711876262802752, "3": 0.0008116186264439755, "1": 0.00029737606738224054, "2": 0}, "score": 4.950068168587904}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.959139385529142, "4": 0.03947733773294425, "3": 0.0009614346134308245, "1": 0.0004104860141222277, "2": 0}, "score": 4.956957360186738}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9987286697259288, "4": 0.0012452922968933739, "1": 1.3325993920999054e-05, "3": 1.1344857504659748e-05, "2": 0}, "score": 4.998678712206046}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.995572823964257, "4": 0.004283502341191152, "1": 8.44580159277075e-05, "3": 5.745790300184434e-05, "2": 0}, "score": 4.995263741463815}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9822700798936609, "4": 0.017077035009201418, "3": 0.00036233259399696987, "1": 0.00028639316167383753, "2": 2.0544035406603104e-06}, "score": 4.981046524049598}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.992524502567587, "4": 0.006955531755161852, "1": 0.00040952934363912784, "3": 0.000104140667563442, "2": 0}, "score": 4.9911980141207914}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9897323727054107, "4": 0.009889859892799363, "1": 0.00022285259812785044, "3": 0.0001505792551642413, "2": 0}, "score": 4.988917523155745}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.984502678240354, "4": 0.014558926038880184, "3": 0.0007967731098034397, "1": 0.00013923728415321532, "2": 1.5561853807579549e-06}, "score": 4.9832858961904005}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9863574911517917, "4": 0.012886323806899974, "3": 0.0006163084433654189, "1": 0.00013720807345219495, "2": 0}, "score": 4.985332187871144}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9920926578187712, "4": 0.007610925486367726, "3": 0.00021895857528268133, "1": 7.540250957622022e-05, "2": 0}, "score": 4.991649530159452}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9795561138295619, "4": 0.019215223951463883, "3": 0.0010504669493519472, "1": 0.00017475999194025064, "2": 1.9117624360164047e-06}, "score": 4.977979033345485}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.976940807257954, "4": 0.022470588559584656, "3": 0.00043120514785565116, "1": 0.0001516527788342309, "2": 0}, "score": 4.976060252465455}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9733931945782709, "4": 0.022696149373661472, "3": 0.003447520506814269, "1": 0.0004436150393986394, "2": 1.3687480158444041e-05}, "score": 4.968593103817534}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.858539713964945, "4": 0.12746094181765436, "3": 0.01306976933412778, "1": 0.000865025994533601, "2": 5.993853125277595e-05}, "score": 4.8427588750043995}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9578385513385436, "4": 0.037955752712554996, "3": 0.003772171683510604, "1": 0.0004186208250108605, "2": 8.957243709592142e-06}, "score": 4.952798268218471}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.986841461595625, "4": 0.011746185845293942, "3": 0.0009743090547312562, "1": 0.0004345072185209221, "2": 2.7776980856773157e-06}, "score": 4.9845588223634145}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9475203733882478, "4": 0.03857649213813041, "3": 0.01328749382548715, "1": 0.0005780550220294287, "2": 2.7562952159829343e-05}, "score": 4.932452934264082}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8728240498668863, "4": 0.1079152912382874, "3": 0.015701877308287107, "1": 0.0033963226710985238, "2": 0.00015490725112258396}, "score": 4.846629783506986}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9849804541593289, "4": 0.01348610207146648, "3": 0.001292548148566134, "1": 0.00023008632347483582, "2": 7.006025454168222e-06}, "score": 4.982987373557498}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9776362467217024, "4": 0.017516909630251293, "3": 0.003305910671709253, "1": 0.001514206105713502, "2": 1.9714404431358708e-05}, "score": 4.9697550892987685}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9911773589383213, "4": 0.008197570902496376, "3": 0.00046968467155836696, "1": 0.000150455003281124, "2": 0}, "score": 4.990261191724221}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9434998718477363, "4": 0.050196207647933144, "3": 0.0035226441231876638, "1": 0.0027226805163297002, "2": 3.9226736111233864e-05}, "score": 4.931748779865372}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"5": 0.874829953821857, "4": 0.10952664784692634, "3": 0.011951087506706311, "1": 0.003646994045021314, "2": 4.179474266116807e-05}, "score": 4.851857294967529}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9742474141133448, "4": 0.02364875046265576, "3": 0.0016866656282721246, "1": 0.0004098640658282765, "2": 3.8079978714624633e-06}, "score": 4.971326937733184}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.923861577927942, "4": 0.06536227642585221, "3": 0.0087952251618532, "1": 0.0019527610203246913, "2": 2.224124744504468e-05}, "score": 4.909168967869087}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9718333789978741, "4": 0.026943518809305147, "3": 0.001001859004793018, "1": 0.00021665030542869588, "2": 2.3508607976645446e-06}, "score": 4.970179042517763}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9856610767675189, "4": 0.013784286431139684, "3": 0.0004219834342628818, "1": 0.00012752641989105732, "2": 0}, "score": 4.984861563406803}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8294571651882019, "4": 0.13891713148529808, "3": 0.03070682304683749, "1": 0.0008079317264347063, "2": 9.221765129585609e-05}, "score": 4.796157024398616}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9411371037093846, "4": 0.05213668246220718, "3": 0.005675649345760195, "1": 0.001008239034545165, "2": 3.0170075569708657e-05}, "score": 4.932387730629061}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9812976456381203, "4": 0.01601618028366557, "3": 0.0020330909672700613, "1": 0.0006457391036988929, "2": 5.2493620659051225e-06}, "score": 4.977318885771913}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9645739670968704, "4": 0.03240785653275084, "3": 0.0026472180046131387, "1": 0.0003610290976395467, "2": 8.531025337429383e-06}, "score": 4.960827943219407}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.987952781381833, "4": 0.010747193803721621, "3": 0.0010362640428523307, "1": 0.000258272326668395, "2": 3.7978288871454616e-06}, "score": 4.9861357718781525}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.990624292611277, "4": 0.0081598744186163, "3": 0.0010413904371129312, "1": 0.00016891988646865812, "2": 3.0716520932112868e-06}, "score": 4.9890724234215735}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9971274570694371, "4": 0.00276738900715904, "1": 5.743819832066067e-05, "3": 4.6656420912645614e-05, "2": 0}, "score": 4.996909542083998}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9899764915940845, "4": 0.009373937939466169, "3": 0.0005008975343762604, "1": 0.00014664835203586995, "2": 1.5410955474681388e-06}, "score": 4.989033044994644}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964144486960115, "4": 0.003372911368515045, "3": 0.00012964624616559973, "1": 8.204374314070743e-05, "2": 0}, "score": 4.996039617404441}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995252336372336, "4": 0.0004454961290911113, "1": 2.2569186752885028e-05, "3": 6.427409358789546e-06, "2": 0}, "score": 4.999451372155056}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9954126312658603, "4": 0.004423940784103855, "3": 0.00014973162994189865, "1": 1.1833897206887893e-05, "2": 0}, "score": 4.995229251482033}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9972030779949129, "4": 0.0026665840705336033, "3": 9.784763833285676e-05, "1": 3.073744314864766e-05, "2": 0}, "score": 4.997014765647529}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9872690963791705, "4": 0.011967220402944819, "3": 0.000490461388849094, "1": 0.00026943941448335053, "2": 0}, "score": 4.985974046109451}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9966634153115996, "4": 0.0031974744984764993, "3": 7.940533504229605e-05, "1": 5.7972836113228823e-05, "2": 0}, "score": 4.996411817272187}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.989273310681292, "4": 0.01005420524155283, "1": 0.0003574297924040588, "3": 0.00030856748083916356, "2": 0}, "score": 4.987898862129444}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9663966048510172, "4": 0.03239739696492713, "3": 0.0007968811595627373, "1": 0.00038535456478305016, "2": 0}, "score": 4.964466578095309}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9740156224420587, "4": 0.02514681074050651, "3": 0.0007675748183975262, "1": 6.322915815466622e-05, "2": 0}, "score": 4.97306494083256}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9659600497415737, "4": 0.03310785544942972, "3": 0.0008160262780712506, "1": 0.00010987073714793345, "2": 0}, "score": 4.964820391009875}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9760895838984448, "4": 0.0230293221253706, "3": 0.0006552901783840082, "1": 0.00020707945453762167, "2": 0}, "score": 4.97483130843249}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9972189662589648, "4": 0.002689879989318103, "1": 5.582241872496847e-05, "3": 3.105697925887099e-05, "2": 0}, "score": 4.997024703659795}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9444641928330852, "4": 0.04882023502089141, "3": 0.004214235837210079, "1": 0.0024766421698811177, "2": 1.2090264693348758e-05}, "score": 4.9328076069466125}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9636586833322708, "4": 0.03305771188382597, "3": 0.002583783710324243, "1": 0.0006923429033544008, "2": 4.073956164646289e-06}, "score": 4.958992987616966}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9645445866212996, "4": 0.03263979922826406, "3": 0.002231714845538422, "1": 0.0005754229053155554, "2": 0}, "score": 4.9605947454447135}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9471171661063673, "4": 0.04632397654431205, "1": 0.003337321632932562, "3": 0.0032080820904913055, "2": 9.590063956584272e-06}, "score": 4.933881547098367}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982703911004486, "4": 0.0016817484209359721, "3": 2.735601845787699e-05, "1": 1.6771525839716987e-05, "2": 0}, "score": 4.998196446706244}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9900244016756896, "4": 0.009611557484355816, "3": 0.00021312621693155812, "1": 0.00014824963235327045, "2": 0}, "score": 4.989369163221286}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8190808926353265, "4": 0.16831076780572543, "3": 0.012159992733722624, "1": 0.0004278709185685868, "2": 1.722790681007912e-05}, "score": 4.80560544793865}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9294186554119004, "4": 0.06639921797858846, "3": 0.0035677030272548314, "1": 0.0005996454464470155, "2": 9.63368256258151e-06}, "score": 4.9240375023479075}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969982868766096, "4": 0.0029013051253634885, "1": 6.729820454835498e-05, "3": 3.157881732388573e-05, "2": 0}, "score": 4.996766339471138}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9582586000654426, "4": 0.03926822151737612, "3": 0.0020347486118067796, "1": 0.00043022983158866915, "2": 7.192908124966394e-06}, "score": 4.9549197378094965}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7745164731126618, "4": 0.17114473105822234, "3": 0.05234434345181779, "1": 0.0016748092513180909, "2": 0.00031645895779559185}, "score": 4.716517065502142}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9850499740705743, "4": 0.014518871398245176, "3": 0.0003665961956497481, "1": 6.235915900466109e-05, "2": 0}, "score": 4.984498465483826}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9848665521884695, "4": 0.014524279232830195, "3": 0.0005368223701603964, "1": 6.887901487459445e-05, "2": 0}, "score": 4.98412650493087}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903545907571331, "4": 0.009298951752134198, "3": 0.00027317498429447703, "1": 7.173979093991088e-05, "2": 0}, "score": 4.989867723484297}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9856725390868282, "4": 0.013978977291037125, "3": 0.000279632868242005, "1": 6.599081449115108e-05, "2": 0}, "score": 4.98519775138098}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9659140054553509, "4": 0.03237800321069404, "3": 0.0011836685767384373, "1": 0.0005184071088296881, "2": 4.015271867124714e-06}, "score": 4.96316891539198}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9634700887298525, "4": 0.0346396499745414, "3": 0.0017241265578658992, "1": 0.00015879110890212913, "2": 4.949524730666906e-06}, "score": 4.961261991157101}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9822072912679453, "4": 0.016881638955627488, "3": 0.0006297691716020127, "1": 0.00027514151298015186, "2": 3.715255897249736e-06}, "score": 4.980747063830538}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9832322246429168, "4": 0.016370104565331126, "3": 0.00032549189395167995, "1": 6.707628528016117e-05, "2": 0}, "score": 4.982710518284119}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9871830097737837, "4": 0.012170021565048582, "3": 0.0004376631532370187, "1": 0.00020605447137048974, "2": 0}, "score": 4.986130389152385}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8539875019667598, "4": 0.12620651573222658, "3": 0.019275540855081676, "1": 0.00045702429799694255, "2": 5.2239376937031825e-05}, "score": 4.833254055927393}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9858997075832286, "4": 0.013488854865812366, "3": 0.0005720838422304051, "1": 3.777103571443156e-05, "2": 0}, "score": 4.9852158699084255}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9847035564753589, "4": 0.014951958266467592, "3": 0.0003117877157399917, "1": 3.0083160337197495e-05, "2": 0}, "score": 4.984304092625605}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9947234089720683, "4": 0.005117697746215009, "3": 0.00011892422885069224, "1": 3.758404247173739e-05, "2": 0}, "score": 4.994494104494579}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9776908199001175, "4": 0.020121306509479867, "3": 0.001845284154627954, "1": 0.00032787339990086574, "2": 8.197748619415891e-06}, "score": 4.974851874413097}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9838637007716535, "4": 0.014963221331053864, "3": 0.0009921939060228806, "1": 0.0001773681574450967, "2": 1.7363592880110965e-06}, "score": 4.982337677719603}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9678600486488895, "4": 0.030333538421739685, "3": 0.0015684075088052743, "1": 0.00022564603574595654, "2": 0}, "score": 4.965626637584052}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9849184747368748, "4": 0.013839215692713796, "3": 0.0009979384069902337, "1": 0.00024047005201941263, "2": 2.089054472199576e-06}, "score": 4.983196729673328}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9927376909400485, "4": 0.007085640554327302, "3": 0.0001461646254371312, "1": 2.8372704049259738e-05, "2": 0}, "score": 4.992508523412945}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9194249764010907, "4": 0.07421892555079088, "3": 0.005160354501538412, "1": 0.0011792219764000162, "2": 1.3095118903200043e-05}, "score": 4.91070388621504}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8119671786655558, "4": 0.16509176634737047, "3": 0.02071446563141663, "1": 0.002141837871637066, "2": 6.438994954492891e-05}, "score": 4.784714397509396}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9015038911877946, "4": 0.09270473768529938, "3": 0.004585727116109022, "1": 0.001040296614752196, "2": 0}, "score": 4.893945085719559}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9066183864654295, "4": 0.08771167185789666, "3": 0.004304324775404896, "1": 0.001342045951447307, "2": 1.4151216016579389e-05}, "score": 4.898268082849877}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.961216364684479, "4": 0.035703841176649376, "3": 0.001626852357661817, "1": 0.001427054142102656, "2": 1.3848564180263686e-05}, "score": 4.9552921536059635}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9784154124742093, "4": 0.020542867059934182, "3": 0.0006188706334083526, "1": 0.0004176150428058346, "2": 2.926164607831908e-06}, "score": 4.976540098848088}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"5": 0.802457207008318, "4": 0.1334241136289312, "3": 0.05772773182762224, "1": 0.005821999613760997, "2": 0.0005629944994181114}, "score": 4.72614181036917}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9459939692032482, "4": 0.04872622952211284, "3": 0.004967795990044496, "1": 0.0003019823457740328, "2": 8.641460068635579e-06}, "score": 4.940104241989779}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9412557932873652, "4": 0.05008999457087602, "3": 0.00818538035071876, "1": 0.00040538918567210267, "2": 4.791681841683037e-05}, "score": 4.9317728782499906}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9324852306822977, "4": 0.0620615713767292, "3": 0.004723762297357099, "1": 0.0007029252512802173, "2": 2.0796684146473857e-05}, "score": 4.925616387964744}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9193451737766231, "4": 0.07016480127749761, "3": 0.009254191453334715, "1": 0.0011660993370000252, "2": 6.285663875162192e-05}, "score": 4.906473205319476}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8665525633338669, "4": 0.11806041429328915, "3": 0.013274113416970584, "1": 0.0020080919226264926, "2": 9.94240024611056e-05}, "score": 4.847059894364182}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9835728900364109, "4": 0.016010690878002228, "3": 0.0002340342700791768, "1": 0.00017361731845991457, "2": 0}, "score": 4.982826620740449}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9556542686606333, "4": 0.03925594818975084, "3": 0.004728283683207041, "1": 0.00034545851303942354, "2": 1.1943564024812987e-05}, "score": 4.949869614295895}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974269449954087, "4": 0.0023139406471486467, "3": 0.00013168116155907967, "1": 0.00012575914851756012, "2": 0}, "score": 4.9969196552790205}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9845079930924086, "4": 0.014821604486920988, "3": 0.0005127509542346801, "1": 0.00015293462736542276, "2": 0}, "score": 4.983541077461059}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9528754656450649, "4": 0.04542762858004332, "3": 0.0016052271595259544, "1": 8.713150751199887e-05, "2": 2.6914647387425245e-06}, "score": 4.9510052257598245}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9936105604372643, "4": 0.006178622060068318, "3": 0.00017639425199232685, "1": 3.306097414614217e-05, "2": 0}, "score": 4.99333633646161}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.997250621582749, "4": 0.0026266841702549913, "1": 6.464078497685895e-05, "3": 5.731329137345989e-05, "2": 0}, "score": 4.9970001238866715}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969505356905185, "4": 0.0029246455065056187, "1": 7.212130968434655e-05, "3": 5.2126296773817105e-05, "2": 0}, "score": 4.99668261476633}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9971229549494195, "4": 0.0026859709400038137, "1": 0.00011457739780131798, "3": 7.595108828946023e-05, "2": 0}, "score": 4.996703815493733}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"5": 0.960811748942116, "4": 0.0376038063874988, "3": 0.001381035912757376, "1": 0.00019640258504243578, "2": 4.953713800315668e-06}, "score": 4.958833565813006}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9988324830788247, "4": 0.001085648581082968, "1": 5.391774033349329e-05, "3": 2.6395711610575462e-05, "2": 0}, "score": 4.998645886928868}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9759438743612237, "4": 0.022645262728224404, "3": 0.0013272754124360581, "1": 7.817552022667827e-05, "2": 3.5452637506508836e-06}, "score": 4.974376800743557}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986343866996241, "4": 0.0013139229478797423, "3": 3.108357541464727e-05, "1": 2.015990151382448e-05, "2": 0}, "score": 4.9985432696442595}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999343776239055, "4": 0.0006128719098876746, "1": 2.349916897982661e-05, "3": 1.954611524448672e-05, "2": 0}, "score": 4.9992540389550175}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8788312405521878, "4": 0.1118201949453283, "3": 0.008533494752799077, "1": 0.0007868440395688319, "2": 2.289275667133676e-05}, "score": 4.867896056616606}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9709601613580602, "4": 0.027512520142721805, "3": 0.0010933044098605023, "1": 0.00042759862262282147, "2": 3.5258853151489175e-06}, "score": 4.968579808099918}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9662757113661147, "4": 0.029662934772982097, "3": 0.003441527036963332, "1": 0.0005991248205527901, "2": 1.3210904115809067e-05}, "score": 4.961017587137409}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9875317577274233, "4": 0.011300285365484606, "3": 0.0007745316762318877, "1": 0.00038638433397143875, "2": 4.007571945140078e-06}, "score": 4.985593047529363}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9769793786193783, "4": 0.022193207619627463, "3": 0.0005906097973405813, "1": 0.00023061866785539241, "2": 0}, "score": 4.975702947829815}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9637371919484151, "4": 0.03238041546178848, "3": 0.0030350126088446922, "1": 0.0008323265551317557, "2": 1.09341023152904e-05}, "score": 4.9581872785529235}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9850437229632736, "4": 0.014119315859043129, "3": 0.0005274113835482303, "1": 0.0003058196527061941, "2": 2.0177954578810806e-06}, "score": 4.983596501288196}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9980751223577289, "4": 0.0017848730263109746, "1": 7.022926173160707e-05, "3": 6.807476305887036e-05, "2": 0}, "score": 4.9977980566560385}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9985283616233152, "4": 0.0014364392079526738, "3": 1.722158532834266e-05, "1": 1.6029897269554465e-05, "2": 0}, "score": 4.998464995042605}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9949911234690212, "4": 0.004610773263143, "1": 0.00025121007919280626, "3": 0.00014087015195543215, "2": 0}, "score": 4.9941026105959825}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9959021153382072, "4": 0.00384689980700524, "1": 0.00017189701680030917, "3": 7.703073961475247e-05, "2": 0}, "score": 4.9953114410017365}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9935248881725104, "4": 0.005734840732090177, "1": 0.0005198345344535768, "3": 0.00021671466012560797, "2": 0}, "score": 4.991752361112949}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9976736813829807, "4": 0.0021187584471245827, "3": 0.0001515092316330025, "1": 5.462362917816365e-05, "2": 0}, "score": 4.997359724804408}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981051683644174, "4": 0.0017718914272146014, "1": 7.46508983419433e-05, "3": 4.544803375467153e-05, "2": 0}, "score": 4.9978386027707815}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986380734648583, "4": 0.0013108912887844974, "1": 2.5625848727013673e-05, "3": 2.4182338628048833e-05, "2": 0}, "score": 4.998538238845384}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9045141683317361, "4": 0.07816157660061411, "3": 0.016745992551379128, "1": 0.0005282903077882803, "2": 4.277374834421984e-05}, "score": 4.8861041359456046}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9558026693983637, "4": 0.04082327069475479, "3": 0.0029622549299802817, "1": 0.0003822269560481685, "2": 0}, "score": 4.9517218836499595}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9619472774151944, "4": 0.03306162614863293, "3": 0.004389205709684129, "1": 0.0005811030210788887, "2": 1.5863383961232387e-05}, "score": 4.955787742480431}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9546469096336578, "4": 0.042832111029431644, "3": 0.0019577535715916334, "1": 0.0005414509918776868, "2": 0}, "score": 4.951085512757997}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9311454351457333, "4": 0.0634106975943804, "3": 0.004641383913472097, "1": 0.0007703285082562264, "2": 2.1277699617830245e-05}, "score": 4.924160562530728}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9850506636057974, "4": 0.012969191743264868, "3": 0.0012946571084642884, "1": 0.0006780228964627948, "2": 0}, "score": 4.981729266069395}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9925395379388955, "4": 0.006581635554620273, "3": 0.0006196661454720315, "1": 0.00025723204026804436, "2": 0}, "score": 4.991150086927892}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9774892818911188, "4": 0.01931501125801936, "3": 0.002981084853244808, "1": 0.00020762375218389778, "2": 0}, "score": 4.9738921413175525}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99767213868136, "4": 0.0021700827033785597, "1": 9.608762715161825e-05, "3": 6.057974267882923e-05, "2": 0}, "score": 4.997324404329413}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990751514363041, "4": 0.0008426021135968017, "1": 6.236215231613229e-05, "3": 1.8653001247920223e-05, "2": 0}, "score": 4.998870641884068}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9541050006652445, "4": 0.037118777698025435, "3": 0.008061871124213197, "1": 0.0006883996514128393, "2": 2.284135155533798e-05}, "score": 4.943935183059146}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9872376059590309, "4": 0.011525111678936962, "3": 0.0007538410659800961, "1": 0.0004666914618055724, "2": 7.5502642146332574e-06}, "score": 4.9850776522700535}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9826640688345424, "4": 0.016429787182486857, "3": 0.0007384261211963393, "1": 0.00016159214835011833, "2": 0}, "score": 4.981446878330613}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998825108426177, "4": 0.0011110935149441226, "3": 3.456250963193831e-05, "1": 2.7970868502972622e-05, "2": 0}, "score": 4.998707896357683}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9779512781801262, "4": 0.020635004452571087, "3": 0.0011359062369338065, "1": 0.00026207862599667275, "2": 0}, "score": 4.976044491689436}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9907820135436171, "4": 0.00891315503258679, "3": 0.00023445122205708848, "1": 6.663603904316355e-05, "2": 0}, "score": 4.990351362241058}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9936675345078638, "4": 0.005821554247826006, "3": 0.0004177050485453295, "1": 8.902342683535843e-05, "2": 0}, "score": 4.992986912613619}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9860833918924643, "4": 0.011632120487101414, "1": 0.0012906258799676251, "3": 0.0009736915385638664, "2": 0}, "score": 4.981257614878209}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9787090173432813, "4": 0.01947724729586533, "3": 0.0013908419441432225, "1": 0.0004032858267081151, "2": 0}, "score": 4.976127457425989}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9866827951795328, "4": 0.012445589199605502, "3": 0.0005577094110264042, "1": 0.0003007638959061924, "2": 0}, "score": 4.985235742358208}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9094261252467176, "4": 0.07422245845572958, "3": 0.009093470049672278, "1": 0.0072047193673337685, "2": 5.025648322220534e-05}, "score": 4.878620593980862}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8461411240413969, "4": 0.13465107178117336, "3": 0.018682765707390466, "1": 0.0004632243796475481, "2": 5.342098028108321e-05}, "score": 4.825968775681384}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9915516872727888, "4": 0.008331748007331687, "3": 9.469342404935829e-05, "1": 1.863794502917896e-05, "2": 0}, "score": 4.991404285571493}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9829644719108287, "4": 0.016325462066394757, "3": 0.0005819808584702925, "1": 0.00012505086292809026, "2": 0}, "score": 4.982010318178835}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9531869638948394, "4": 0.04460623640601974, "3": 0.002137121604412408, "1": 6.065060180711187e-05, "2": 0}, "score": 4.950876474515649}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9767682312547584, "4": 0.02211704059348069, "3": 0.0010195274941955136, "1": 9.16539028772388e-05, "2": 2.0994419219614477e-06}, "score": 4.975470954979653}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9453724331269036, "4": 0.04937544713021657, "3": 0.004341898431066033, "1": 0.0008872143034899249, "2": 1.7709824781129213e-05}, "score": 4.938338442686762}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.974367482891609, "4": 0.02460880680272001, "3": 0.0009022616521299718, "1": 0.00011451548545112632, "2": 0}, "score": 4.973128421646047}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988979010576198, "4": 0.0010693029407946829, "1": 1.934332808026243e-05, "3": 1.1666944163301456e-05, "2": 0}, "score": 4.998829987769232}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9820484860993305, "4": 0.017025153684458855, "3": 0.0006899857588043153, "1": 0.00023215089226985498, "2": 1.9685250523979315e-06}, "score": 4.980660322041947}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9953436555420626, "4": 0.003643147402243652, "1": 0.0007595943630491745, "3": 0.0002485377033982211, "2": 2.1717570881830738e-06}, "score": 4.992814863679231}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.995572352759751, "4": 0.004054650844719705, "3": 0.00022137310987760915, "1": 0.00014843238845497234, "2": 0}, "score": 4.994908857136392}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9734311508391165, "4": 0.023575090774830932, "3": 0.0028621505389996044, "1": 0.00012331259546628578, "2": 5.688209694620672e-06}, "score": 4.970190215420863}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9935734889226725, "4": 0.0059905083740318735, "3": 0.0002839748159407516, "1": 0.00014740111703224478, "2": 0}, "score": 4.992851904453361}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9916147519655353, "4": 0.0078292308888848, "3": 0.000381420430161104, "1": 0.0001713863831195474, "2": 0}, "score": 4.990722352933985}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9904461567380222, "4": 0.009073075386007, "3": 0.0004009738679452532, "1": 7.575470524941924e-05, "2": 1.9317195367990792e-06}, "score": 4.989816141435165}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9959372354496365, "4": 0.003907446059947525, "3": 0.00011449401581044604, "1": 3.8429237302250984e-05, "2": 0}, "score": 4.995709838683268}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9765277365731747, "4": 0.022303960843221716, "3": 0.000937153001845527, "1": 0.00020472191743957987, "2": 0}, "score": 4.975002184849461}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960728823744052, "4": 0.0038108668348981684, "3": 9.344093803806275e-05, "1": 1.9918412554947715e-05, "2": 0}, "score": 4.995922565849149}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9977159247786317, "4": 0.0021885632514820016, "3": 5.129188527876919e-05, "1": 3.8563204014943716e-05, "2": 0}, "score": 4.997554586328489}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9631109085323704, "4": 0.03160271956211984, "3": 0.004840105795103652, "1": 0.0004292955278908966, "2": 1.5386439321614916e-05}, "score": 4.956953659226577}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9252043471779268, "4": 0.06315542672437935, "3": 0.009838185355657338, "1": 0.001704134877917585, "2": 9.49307385649719e-05}, "score": 4.910066603273793}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9790538782526551, "4": 0.018036550438681853, "3": 0.0015333475384371018, "1": 0.0013656387651328097, "2": 7.779052607529528e-06}, "score": 4.973410787658024}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941008791466786, "4": 0.005686649752194932, "3": 0.0001700496678095318, "1": 3.971099327154863e-05, "2": 0}, "score": 4.993814390173375}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9663214656042709, "4": 0.028149505251107494, "3": 0.0041045465706433994, "1": 0.0014045532475986952, "2": 1.794196814987756e-05}, "score": 4.957969279182663}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9738729152583209, "4": 0.02228131152680607, "3": 0.0033950241655991724, "1": 0.0004223872545140017, "2": 2.1443950078404283e-05}, "score": 4.969174546028002}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9911524172650784, "4": 0.008118758748326143, "1": 0.0004102765965466599, "3": 0.0003100599165399389, "2": 0}, "score": 4.9896199269318116}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9911501911392492, "4": 0.006837921279790384, "3": 0.0014374019447027995, "1": 0.0005603243754813217, "2": 9.36764338266182e-06}, "score": 4.9880178169607285}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978633264437339, "4": 0.002009294929083279, "1": 6.634547489760903e-05, "3": 6.028851118474472e-05, "2": 3.4246889530361206e-07}, "score": 4.997603717778553}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9825389571318678, "4": 0.015793631339281855, "3": 0.0014232006000392487, "1": 0.0002351046085737001, "2": 7.2672907318139955e-06}, "score": 4.9803977111049615}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9679989784755211, "5": 0.020252071385883665, "3": 0.006043924659420593, "4": 0.00415585124173923, "2": 0.0015464368512595674}, "score": 1.1071104186414324}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9907149596860686, "4": 0.009019572867180128, "3": 0.0002048585125079032, "1": 5.67493701694518e-05, "2": 0}, "score": 4.990343675357923}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9890871509191257, "4": 0.010703487029474414, "3": 0.0001734006057943905, "1": 3.319348288352322e-05, "2": 0}, "score": 4.9888169068730175}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941377560027598, "4": 0.005778091737676558, "3": 5.707656191004693e-05, "1": 2.1554865276609404e-05, "2": 0}, "score": 4.994021502671116}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9926642747461948, "4": 0.007056766748575877, "3": 0.00020816240284639658, "1": 6.813435454401949e-05, "2": 0}, "score": 4.9922543504105885}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9880096866309429, "4": 0.011102594047433308, "3": 0.0007285254486461747, "1": 0.00015262372185238787, "2": 3.6401014712031922e-06}, "score": 4.986818901242177}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9655961213845659, "4": 0.031992147401483914, "3": 0.0021541802978794467, "1": 0.00024463188194797703, "2": 9.131313566937838e-06}, "score": 4.9626934292274}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9766001595320931, "4": 0.022634913944026145, "3": 0.0006157533995427377, "1": 0.00013768804158131333, "2": 0}, "score": 4.975582546654091}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9710006172559748, "4": 0.02685345469026407, "3": 0.0016514404036151896, "1": 0.00047892382616254183, "2": 1.1009720429148396e-05}, "score": 4.967894793826134}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9465323721150385, "4": 0.051069950887157996, "3": 0.0022733458271413493, "1": 0.00011543638026223657, "2": 5.865346490146565e-06}, "score": 4.943903845957887}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9986302239008594, "4": 0.0010992857810635942, "1": 0.0002583071957861073, "3": 1.2129064024763595e-05, "2": 0}, "score": 4.997843227191151}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9954682684234686, "4": 0.004499495498208726, "3": 2.5391654523374428e-05, "1": 6.757294296693622e-06, "2": 0}, "score": 4.9954226916167395}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9952874361387863, "4": 0.00253270595593768, "1": 0.0018820467453557865, "3": 0.00029697428660414746, "2": 4.922953478767059e-07}, "score": 4.989343677931454}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975768652422077, "4": 0.002415612018921445, "3": 6.8024888866900636e-06, "1": 5.642942509247004e-07, "2": 0}, "score": 4.997568525447099}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973554318477513, "4": 0.002621436051782327, "1": 1.1968576114276424e-05, "3": 1.1066799143316256e-05, "2": 0}, "score": 4.997308555785144}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9454651314384321, "4": 0.05171952030328358, "3": 0.0025159686511974618, "1": 0.0002884813842772743, "2": 7.978006418152467e-06}, "score": 4.9420705136713226}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9498911632030957, "4": 0.047233343769710105, "3": 0.002546316942870197, "1": 0.0003143583439452879, "2": 8.506661461913549e-06}, "score": 4.946390730652053}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9469658790645805, "4": 0.05043570107534632, "3": 0.0021202942558516736, "1": 0.0004620363455293074, "2": 7.933216444103763e-06}, "score": 4.943451304167948}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9704457062878286, "4": 0.027994920387408147, "3": 0.0009568881968826341, "1": 0.0005920920176141642, "2": 0}, "score": 4.967722599685789}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9495912558259297, "4": 0.04904828784009941, "3": 0.0011306766727950234, "1": 0.0002221917078193229, "2": 0}, "score": 4.947801195900943}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9755528783315762, "4": 0.02243744643577497, "3": 0.0013412453914988924, "1": 0.0006287351846555681, "2": 2.0097723661183e-05}, "score": 4.972304286120577}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.990902325563065, "4": 0.008596331813739295, "3": 0.00025320882865410155, "1": 0.00024420744730700597, "2": 0}, "score": 4.98992038116364}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9776811447196367, "4": 0.020888644354300274, "3": 0.0007724581696336929, "1": 0.0006465070855187297, "2": 0}, "score": 4.974980129599129}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9858290289949676, "4": 0.01350663139094301, "3": 0.000470308686057153, "1": 0.00018389198698107978, "2": 0}, "score": 4.984817029349774}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9959832358650327, "4": 0.0036806629263323835, "1": 0.0001978795590456426, "3": 0.0001356400326494791, "2": 1.2704975024360117e-06}, "score": 4.995252721055429}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9610504077053639, "4": 0.035190293051175964, "3": 0.0034800625890440604, "1": 0.0002588784270742712, "2": 1.1340116345194163e-05}, "score": 4.956779657947561}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9970452120043449, "4": 0.0027887146171711084, "3": 9.967297309926794e-05, "1": 6.569682233037138e-05, "2": 4.5245750039335384e-07}, "score": 4.996747793958096}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9797632021245711, "4": 0.01857330396406226, "3": 0.001253544299931472, "1": 0.0004022705845005906, "2": 5.018723196189237e-06}, "score": 4.977295408527374}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999336036771202, "4": 0.0006076792892216414, "1": 4.040039483101499e-05, "3": 1.5412264028321553e-05, "2": 0}, "score": 4.999199894226323}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987594680966538, "4": 0.001161697478468813, "1": 4.048261237952684e-05, "3": 3.781082956282308e-05, "2": 0}, "score": 4.998600749655917}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9344500075371106, "4": 0.055459952237563816, "3": 0.008990914603703248, "1": 0.0010183023510401644, "2": 6.324743402210847e-05}, "score": 4.922293901099109}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9887386847111421, "4": 0.01084957142256768, "3": 0.00028371878614357046, "1": 0.00012388052065130076, "2": 0}, "score": 4.988087419550141}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9879362683830722, "4": 0.01135647742049316, "3": 0.0005602332741446081, "1": 0.00013857789107304613, "2": 0}, "score": 4.986968634442699}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9910621293747559, "4": 0.00852824229721416, "3": 0.00033412078454026395, "1": 6.814239487222575e-05, "2": 0}, "score": 4.990530876812716}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9928485035270673, "4": 0.006865523405919439, "3": 0.0001861551671574326, "1": 9.875771802716953e-05, "2": 5.372872334800834e-07}, "score": 4.992365519533927}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9388326191776196, "4": 0.052187347423337874, "3": 0.007496563975623753, "1": 0.001439948399092242, "2": 3.756194955071931e-05}, "score": 4.92694660984978}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9862439590617508, "4": 0.012964687028567495, "3": 0.0007664485386511545, "1": 2.255939385104768e-05, "2": 0}, "score": 4.985412144095948}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918632034046645, "4": 0.007160975960257821, "3": 0.000828566880128691, "1": 0.0001451377886803927, "2": 1.643786723462397e-06}, "score": 4.990596403324406}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963100699850909, "4": 0.0034067006751628557, "1": 0.00014251105248001865, "3": 0.00013791348357861143, "2": 0}, "score": 4.995747416220097}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9903841755665294, "4": 0.009048659081846464, "3": 0.0004211965367833537, "1": 0.00013906640570911344, "2": 0}, "score": 4.989552610109591}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9567521380289632, "4": 0.03360404608722995, "3": 0.0076662170430467, "1": 0.001953741552449866, "2": 1.991297557050236e-05}, "score": 4.943188590608199}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.997533218917192, "4": 0.002174914338097171, "1": 0.000151028197526007, "3": 0.00013895047267754613, "2": 0}, "score": 4.996943066154724}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9843757234845278, "4": 0.013634403654745685, "3": 0.0019109897068542872, "1": 7.204843188619013e-05, "2": 0}, "score": 4.9822553019239235}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99698975559877, "4": 0.0026163593202077977, "1": 0.00025448974944874335, "3": 0.0001374209108724347, "2": 0}, "score": 4.996090832141911}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921314900774527, "4": 0.007537817463036319, "3": 0.0003092211009147794, "1": 1.887307980857995e-05, "2": 0}, "score": 4.991768226627458}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9284256377317802, "4": 0.057708615568668145, "3": 0.013206567965425268, "1": 0.0006096122247921593, "2": 4.450121792791405e-05}, "score": 4.913305856816431}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9815997492850954, "4": 0.016528442404365837, "3": 0.0014063599618152447, "1": 0.00045297152190918464, "2": 8.252296769992778e-06}, "score": 4.978822105227405}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7742941955510745, "4": 0.12815789763729718, "3": 0.07133517037781312, "1": 0.02460213625942879, "2": 0.0015511036021757818}, "score": 4.626087659260254}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9750351181671216, "4": 0.023364969691636713, "3": 0.0014372086271421348, "1": 0.00015490725112258396, "2": 5.438202361283313e-06}, "score": 4.973124606068697}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9417434251105565, "4": 0.049403485529499004, "3": 0.007986058061155144, "1": 0.0008067801141452618, "2": 5.1632977023749756e-05}, "score": 4.931241786387977}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9251961813603944, "4": 0.067670171119917, "3": 0.00693996186108096, "1": 0.00017072952139004043, "2": 1.7529664462027004e-05}, "score": 4.917713951555974}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9593338726734992, "4": 0.039452526131055876, "3": 0.0011259681901213108, "1": 7.939088458634968e-05, "2": 0}, "score": 4.95797762759689}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8876832411881064, "4": 0.10346320880028347, "3": 0.008287814296718491, "1": 0.0005397248960391257, "2": 1.9513773663861553e-05}, "score": 4.877742927391407}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9819919325375117, "4": 0.017408851416656705, "3": 0.0005202306432573567, "1": 7.404200430910314e-05, "2": 0}, "score": 4.981254426612757}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9788361256430996, "4": 0.02024743824200245, "3": 0.0008422839228725974, "1": 6.661831621401886e-05, "2": 0}, "score": 4.97780135340555}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.930067011550554, "4": 0.06450953736419343, "3": 0.004775402573580347, "1": 0.0006170922694128708, "2": 2.637824343209428e-05}, "score": 4.923391802968463}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9018191300819316, "4": 0.09527610826641716, "3": 0.0025483186250818456, "1": 0.0003316620596741378, "2": 0}, "score": 4.898298085972957}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8331333796543511, "4": 0.14859596507417488, "3": 0.01766564828508658, "1": 0.0005468396187982327, "2": 4.631151146597553e-05}, "score": 4.813744237124534}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.860647126522194, "4": 0.12794208223534514, "3": 0.008913301209527979, "1": 0.002345783072479436, "2": 8.749490455093089e-05}, "score": 4.844575718229359}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9803060383866792, "4": 0.018324326224299695, "3": 0.0009215603425829461, "1": 0.0004403187770830631, "2": 4.6342091461948036e-06}, "score": 4.978057306848354}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9114768343973865, "4": 0.08364895869358062, "3": 0.004028612722016399, "1": 0.0008327080145449952, "2": 9.162055544790831e-06}, "score": 4.9049351436049315}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9491268948813011, "4": 0.04698220810020905, "3": 0.0021610144818979406, "1": 0.0017198838835493153, "2": 5.392561791302638e-06}, "score": 4.941799781640907}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.993796672578241, "4": 0.0055801144056189635, "3": 0.0003575776559422689, "1": 0.00026353852387631674, "2": 1.120464753776294e-06}, "score": 4.992647207613673}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9795202020016204, "4": 0.019064812890766485, "1": 0.0007815991068159341, "3": 0.0006281882344642608, "2": 2.7755989395017787e-06}, "score": 4.976544030601939}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9756879110233269, "5": 0.024215363303444298, "1": 6.50278446868094e-05, "3": 2.6692898545862188e-05, "2": 2.0987492204292396e-06}, "score": 4.023989459090101}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.882185603770291, "4": 0.08486027487963252, "3": 0.025310701208712642, "1": 0.007384212527733679, "2": 0.00024874880150687305}, "score": 4.834233492466729}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9064081605991599, "4": 0.07647654396516734, "3": 0.0159095041985476, "1": 0.0011146609511474986, "2": 6.93254136262421e-05}, "score": 4.887035364412809}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9472564215085421, "4": 0.041328200136641534, "3": 0.010522126008791316, "1": 0.0008658017514774171, "2": 2.3153976989120224e-05}, "score": 4.934094595738583}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9024031207196764, "4": 0.08485910381591957, "3": 0.011201278000537164, "1": 0.0014576398388784517, "2": 5.868866208244573e-05}, "score": 4.886729430291327}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9268896781920859, "4": 0.06224656038645432, "3": 0.009516035081192871, "1": 0.0012760502678100922, "2": 5.023995155883295e-05}, "score": 4.913464593541809}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9681094595992573, "4": 0.028185401849053417, "3": 0.003356456750384769, "1": 0.000328973288652838, "2": 1.3464378358200271e-05}, "score": 4.9637451719804755}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9603393282959901, "4": 0.030942798149445287, "3": 0.007852844155536958, "1": 0.0007470443528217618, "2": 0}, "score": 4.950357479053065}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9417241892558117, "4": 0.04763647165000972, "3": 0.009888676147418769, "1": 0.0006287294631914201, "2": 0}, "score": 4.930062730507487}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9663743383633668, "4": 0.029760972245834304, "3": 0.0034079682035596825, "1": 0.00041407145599943804, "2": 2.0527810118746105e-05}, "score": 4.961704374919895}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9856513522833065, "4": 0.012795982813638243, "3": 0.0013157255716575277, "1": 0.0002266474118026491, "2": 6.5398521485896776e-06}, "score": 4.983646295479189}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8573262023152965, "4": 0.09343567942515613, "1": 0.02458332282224755, "3": 0.024155014033473726, "2": 0.0004975865732111093}, "score": 4.758427711289017}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9777754984357807, "4": 0.020706512803654823, "3": 0.0011495684131040535, "1": 0.00036486395495942365, "2": 2.6655290559304883e-06}, "score": 4.975526876160919}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9657931192236463, "4": 0.031709175247320726, "3": 0.002136918801195315, "1": 0.00035373118418658534, "2": 4.670326847381076e-06}, "score": 4.962587962197179}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9940604681767706, "4": 0.005768404806673351, "3": 0.00010210161654102931, "1": 6.788550648590257e-05, "2": 0}, "score": 4.993755842816626}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9361938212091451, "4": 0.05827877016831735, "3": 0.004365700157146839, "1": 0.0011272333626602363, "2": 2.3265755488879462e-05}, "score": 4.928410296326434}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9548667347529421, "4": 0.03872661070999884, "3": 0.00610087363015135, "1": 0.00022536528123739892, "2": 0}, "score": 4.948166012642225}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9923602454155274, "4": 0.007087339894674988, "3": 0.00039301412706924506, "1": 0.00015385822445561102, "2": 0}, "score": 4.991511151905296}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9691032690139798, "4": 0.029064522693513957, "3": 0.0015590674888659784, "1": 0.00024692176806182415, "2": 1.5424660471302636e-05}, "score": 4.966783022718579}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9316922059202492, "4": 0.061686097352521105, "3": 0.005585077333019929, "1": 0.0009917108252303684, "2": 3.114680145579248e-05}, "score": 4.923082405754099}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.98924181272053, "4": 0.010044470448743483, "3": 0.0005989474459550297, "1": 0.0001113453416878936, "2": 2.1809303634060967e-06}, "score": 4.988305695964167}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8412348896227231, "4": 0.1445753288995145, "3": 0.013540059731814777, "1": 0.0005929285827680322, "2": 4.8344601350164194e-05}, "score": 4.82582633198473}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.82349110572465, "4": 0.16777018206407393, "3": 0.008144663104747171, "1": 0.0005519036908539771, "2": 2.8225661825542454e-05}, "score": 4.813645605970245}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8639270211561607, "4": 0.12594776770509652, "3": 0.008890842184755937, "1": 0.001143362267432884, "2": 0}, "score": 4.851683601071632}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9699170108204749, "4": 0.029048503838156218, "3": 0.0008908834028993457, "1": 0.0001349949753294999, "2": 4.149938678897969e-06}, "score": 4.968617159764603}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9667921072247536, "4": 0.03136588317033339, "3": 0.0016854484637434705, "1": 0.00014252815483243675, "2": 8.156854020745294e-06}, "score": 4.964668429107802}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.95522834535376, "4": 0.043388953409890144, "3": 0.0011810422117810803, "1": 0.00019600272417074773, "2": 3.3948804877611315e-06}, "score": 4.953454661369846}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9868684017484031, "4": 0.012631570544928094, "3": 0.0003001368561989637, "1": 0.00019589142623502453, "2": 0}, "score": 4.985984533983939}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9932266720966876, "4": 0.0065200841283868695, "3": 0.00017311750056448497, "1": 7.845651780144325e-05, "2": 0}, "score": 4.992819842810164}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9934420552959224, "4": 0.006184721515126285, "1": 0.00021623581709305013, "3": 0.0001524612641127167, "2": 0}, "score": 4.9926453794004715}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9789170023825254, "4": 0.019883647872385217, "3": 0.0008848574494481963, "1": 0.0003079284830014749, "2": 3.752313405718459e-06}, "score": 4.97710360198329}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9887263364308178, "4": 0.010147488931632804, "3": 0.0009297382156413512, "1": 0.00019177418459723834, "2": 2.0534443581933597e-06}, "score": 4.987219744224579}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9771887775073466, "4": 0.017613334883238428, "3": 0.003775763745710193, "1": 0.001402994216652044, "2": 1.6028598900460295e-05}, "score": 4.969174979372158}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.958197085670863, "4": 0.03739252727525086, "3": 0.004026732604451342, "1": 0.0003500666475630479, "2": 1.4460482122275896e-05}, "score": 4.953109462588925}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9956215113538582, "4": 0.003623312559073285, "1": 0.0004248743839096007, "3": 0.0003268932150105445, "2": 0}, "score": 4.9940233831040395}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9845680824024478, "4": 0.01506270737787971, "3": 0.00029218336221054444, "1": 7.325419808270992e-05, "2": 0}, "score": 4.9840598489686085}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9802479579548316, "4": 0.016385262110178274, "3": 0.0030764928987808376, "1": 0.00028072528507797447, "2": 8.580057009693982e-06}, "score": 4.9763130875276165}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.97234232530212, "4": 0.01262391813209314, "3": 0.0002684794992008122, "1": 4.13370651175825e-05, "2": 0}, "score": 4.986474627840867}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.974799105359273, "4": 0.023811181445399458, "3": 0.001306268473446196, "1": 8.136177417372607e-05, "2": 1.6685042359180658e-06}, "score": 4.973245817910209}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977134309907943, "4": 0.002106764332925915, "1": 0.0001471847437564059, "3": 3.18668905809776e-05, "2": 0}, "score": 4.997240760833064}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975855241472195, "4": 0.001945169809630555, "1": 1.5812227892564005e-05, "3": 6.2998105276200095e-06, "2": 0}, "score": 4.997978077466108}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9746901435315429, "4": 0.024031800616945823, "3": 0.001107445463662623, "1": 0.00016345480955334802, "2": 4.426085494926275e-06}, "score": 4.973086137499837}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9885743887795874, "4": 0.010915723568201242, "3": 0.00043794172692024173, "1": 6.92374262347566e-05, "2": 0}, "score": 4.987931410585256}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984806983091377, "4": 0.001410645327806349, "1": 5.7742793744125755e-05, "3": 5.037129947243419e-05, "2": 0}, "score": 4.998257639953444}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948325310419011, "4": 0.004903561995989177, "3": 0.00023515915917051385, "1": 2.826831476976749e-05, "2": 2.9445254039477336e-07}, "score": 4.994512162053524}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955104386466141, "4": 0.004173221497754576, "1": 0.00016408433902173112, "3": 0.00014942902903854026, "2": 0}, "score": 4.994871568592633}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9865421604773438, "4": 0.012780799158803981, "3": 0.0006086257568021705, "1": 6.441075085786311e-05, "2": 2.4533110421819917e-06}, "score": 4.98573692427549}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9221196745384875, "4": 0.07117815638358439, "3": 0.006364332009036115, "1": 0.0003166473069037834, "2": 1.7958482355945452e-05}, "score": 4.914772439529579}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9251185384541671, "4": 0.06849148828827643, "3": 0.006044674152545977, "1": 0.00032434720356534953, "2": 1.4155221377443931e-05}, "score": 4.918078752135726}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9745487087099113, "4": 0.024390745534531806, "3": 0.000903257034481058, "1": 0.00015338982516683068, "2": 1.9981356243232333e-06}, "score": 4.9731831357165355}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9586026594060716, "4": 0.03839130796840754, "3": 0.002479673204170256, "1": 0.0005182027412004024, "2": 6.186085885173042e-06}, "score": 4.954557886852827}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9491159448674802, "4": 0.04517820042347286, "3": 0.003713436688539462, "1": 0.001954023888502484, "2": 2.403032460462041e-05}, "score": 4.939505870745604}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8925903124746177, "4": 0.06500947828161549, "1": 0.023149532338838798, "3": 0.018986941985706184, "2": 0.00025426615124478504}, "score": 4.803653850781752}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.911456344628455, "4": 0.07915195444778257, "3": 0.008056363523648377, "1": 0.0012693703358546738, "2": 5.7851336600618044e-05}, "score": 4.899483467386895}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9882472524764487, "4": 0.010494156505719715, "1": 0.000770054705142928, "3": 0.0004840695321979327, "2": 2.458367613571656e-06}, "score": 4.9854500812842275}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9777259274523957, "4": 0.020564841183282594, "3": 0.001346293524284416, "1": 0.00035540886458396994, "2": 5.4282378384132075e-06}, "score": 4.975304599717741}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8168040449111728, "4": 0.15164122651992845, "3": 0.028198598524099786, "1": 0.0032424200466868985, "2": 0.0001094376037378476}, "score": 4.778662637793411}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9639256730397645, "4": 0.034364765439350964, "3": 0.0013199122788615934, "1": 0.00037883625162646263, "2": 7.661421630367076e-06}, "score": 4.961456959260485}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9979241059546026, "4": 0.001831407467165306, "1": 0.0001388200594223075, "3": 0.00010438354603139351, "2": 0}, "score": 4.99740454187318}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9877083856758158, "4": 0.011924800165001612, "3": 0.0002977509973834398, "1": 6.651982729032685e-05, "2": 0}, "score": 4.987213586010942}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.941851481299434, "4": 0.051918401230576734, "3": 0.00541793517574741, "1": 0.0007929340539514306, "2": 1.7331238346165067e-05}, "score": 4.934021872006885}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9739918674647243, "4": 0.02496288143591029, "3": 0.0008936729298588851, "1": 0.0001471282356650513, "2": 2.7581510834979785e-06}, "score": 4.972652939043175}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9955129197603723, "4": 0.004309277596222739, "3": 0.00014689639729001348, "1": 2.9454348550692875e-05, "2": 0}, "score": 4.995279105360739}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9745980825472701, "4": 0.022967438121473255, "3": 0.002215612256301778, "1": 0.00021104567050894186, "2": 4.388542019712302e-06}, "score": 4.971743892058496}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9867496511239231, "4": 0.012718744865941111, "3": 0.0004582376142401602, "1": 6.72953780831201e-05, "2": 0}, "score": 4.986095513978864}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9929508724777094, "4": 0.006637614115629412, "3": 0.00025073837327346, "1": 0.00015670225784424643, "2": 0}, "score": 4.992234068477551}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9992320006625727, "4": 0.0006768990567064671, "1": 6.272571919089495e-05, "3": 2.7541791939135437e-05, "2": 0}, "score": 4.999017113664134}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9925651413227711, "4": 0.00620844200113056, "3": 0.0009173458527980366, "1": 0.0003025705755808798, "2": 0}, "score": 4.990746523841063}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9958847369979209, "4": 0.003102026721449696, "1": 0.0005695076171573126, "3": 0.00044051220756418253, "2": 2.4064353820186713e-06}, "score": 4.99373169401119}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963275886575939, "4": 0.002990333677440279, "1": 0.0003949238091090571, "3": 0.00028454532571139577, "2": 1.6448982989576454e-06}, "score": 4.994855940782824}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993654426167479, "4": 0.0004937830535948609, "1": 0.0001103205873981121, "3": 2.981541548652414e-05, "2": 0}, "score": 4.9990053031308985}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8082858324376453, "4": 0.16811545558367927, "3": 0.021293402415479872, "1": 0.002218300315469092, "2": 6.680958497936545e-05}, "score": 4.780219670080004}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9688945146765203, "4": 0.03041749629827169, "3": 0.0004269116392457992, "1": 0.0002455875635462632, "2": 0}, "score": 4.9677458305576945}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9116586101162794, "4": 0.08447362698675939, "3": 0.0020258469883916532, "1": 0.0018034153414059504, "2": 0}, "score": 4.904257331523795}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9571622707413409, "4": 0.04100081641151928, "3": 0.0009175985246372121, "1": 0.0009061612387866433, "2": 0}, "score": 4.953538730475092}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9760226879390835, "4": 0.022150382810483434, "3": 0.0009292374076205599, "1": 0.0008871099732225742, "2": 7.369991537498379e-06}, "score": 4.972420503924795}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9594353602156706, "4": 0.035887992865620076, "3": 0.003910062188985368, "1": 0.0007437135579642405, "2": 2.0021116828375858e-05}, "score": 4.95325683195347}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9568810260064491, "4": 0.04076826576878074, "3": 0.0015714198582569955, "1": 0.0007657919736318257, "2": 7.044622486978084e-06}, "score": 4.953004289547183}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.991021151785007, "4": 0.008409493775263384, "3": 0.00032766592171250275, "1": 0.0002384448526878758, "2": 1.502901477360988e-06}, "score": 4.989976868818224}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979383481296953, "4": 0.0020178382780088773, "1": 2.5939205705391926e-05, "3": 1.7377331299558327e-05, "2": 0}, "score": 4.9978436491647455}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9815306117600687, "4": 0.017825319296412408, "3": 0.0004892628927332693, "1": 0.0001476502878844622, "2": 0}, "score": 4.980605414983532}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9736198298138061, "4": 0.023794942996981937, "3": 0.0021287081193576084, "1": 0.0004463352083573659, "2": 7.932296244368876e-06}, "score": 4.97013843580688}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9612467617101995, "4": 0.03343929411465325, "3": 0.004522142468425626, "1": 0.0007676546503298276, "2": 2.017379647223098e-05}, "score": 4.9543850997179035}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.992619401379271, "4": 0.006054932801844114, "1": 0.00098273141997227, "3": 0.0003379079624518719, "2": 2.5635206252930013e-06}, "score": 4.989330608753675}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9878967062794258, "4": 0.011259016552556483, "3": 0.0006355731294985708, "1": 0.00020240437604682112, "2": 0}, "score": 4.986660135647617}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9498418964758035, "4": 0.04680116421401996, "3": 0.002549581629844161, "1": 0.0007816073918103771, "2": 1.605384778078564e-05}, "score": 4.944924547379845}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9694334241027974, "4": 0.0275153458236367, "3": 0.002777528431886754, "1": 0.00025753137516037675, "2": 8.752247792623014e-06}, "score": 4.965872961913562}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9843729495176476, "4": 0.013970959851787612, "3": 0.0015395774243251092, "1": 0.00010801645298384251, "2": 3.7877154661288466e-06}, "score": 4.982506373963082}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9927944456884562, "4": 0.006983735035173092, "3": 0.0001434897433832815, "1": 7.036848860837285e-05, "2": 0}, "score": 4.9924477513998395}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987614919848905, "4": 0.0012114074663868806, "3": 1.3266625995666097e-05, "1": 1.2873997223514283e-05, "2": 0}, "score": 4.998710562054964}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9859030724646728, "4": 0.013723969175737575, "3": 0.0002783854204356893, "1": 9.169066346229729e-05, "2": 0}, "score": 4.98535245511128}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"5": 0.878801782622722, "4": 0.08954216923747677, "3": 0.029940511978097606, "1": 0.0016194381676224129, "2": 8.890777157268128e-05}, "score": 4.843831207932755}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9934927683301485, "4": 0.006339867562162519, "3": 0.00015108862088888446, "1": 1.4599562433606899e-05, "2": 0}, "score": 4.993299545716871}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.988232933865739, "4": 0.009247528059340331, "1": 0.0012600001991036416, "3": 0.0012480624128361469, "2": 5.588212999450071e-06}, "score": 4.98319948277073}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9921571905844432, "4": 0.007514343636830838, "3": 0.0002162131135242133, "1": 0.00010655524232712223, "2": 0}, "score": 4.99162696146207}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989342938685534, "4": 0.001020065946851441, "1": 2.2010146640482625e-05, "3": 1.9358286253457597e-05, "2": 0}, "score": 4.9988531719951155}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9913945397760973, "4": 0.007795785592186275, "3": 0.0007639267120768394, "1": 4.1258970589093204e-05, "2": 2.29684641452391e-06}, "score": 4.990504413746762}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9896495860447252, "4": 0.00976670037761741, "3": 0.0004698382835601598, "1": 0.00011151426924062424, "2": 1.253635284202557e-06}, "score": 4.988843792718179}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9945785792335844, "4": 0.0043862220643559255, "1": 0.0005228687925704211, "3": 0.0005079944681061025, "2": 2.0541303231587695e-06}, "score": 4.992500134328655}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972477719431693, "4": 0.0026245086012142483, "3": 9.415106417038788e-05, "1": 3.31769566444223e-05, "2": 2.09094820764166e-07}, "score": 4.997053853622203}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9977036968471905, "4": 0.0021335223065764345, "3": 9.267451891860268e-05, "1": 6.86766706071977e-05, "2": 0}, "score": 4.997406418265226}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8393394462588313, "4": 0.15026185602916192, "3": 0.010108546751009759, "1": 0.00023826811136455135, "2": 3.8330869279514474e-05}, "score": 4.828450660582244}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9023222690222701, "4": 0.08773388326505656, "3": 0.009402337033707308, "1": 0.0005048327861776405, "2": 3.214440983513134e-05}, "score": 4.891345185708564}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8685576992384532, "4": 0.1127746950215902, "3": 0.018163861331947504, "1": 0.0004265273783540916, "2": 5.94640279802734e-05}, "score": 4.849010400198539}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9718037676859467, "4": 0.02561448415984685, "3": 0.002134841230867528, "1": 0.0004352175225590378, "2": 9.0792497083882e-06}, "score": 4.968347642921624}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9868485471427564, "4": 0.012149405991247194, "3": 0.0006163854867359497, "1": 0.0003811584461984379, "2": 3.217181153428957e-06}, "score": 4.985083518528131}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8123069199524386, "4": 0.16869033198391958, "3": 0.01834599104522186, "1": 0.0005511940130440862, "2": 9.537901235419787e-05}, "score": 4.792124655835343}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9468853903856774, "4": 0.05192045723997418, "3": 0.0011331008380158617, "1": 5.08640841187405e-05, "2": 0}, "score": 4.9456093306451745}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8771994144151634, "4": 0.1092460282891495, "3": 0.013213926072824692, "1": 0.0002728304549080666, "2": 5.033026358775862e-05}, "score": 4.863081414918066}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9866998540858439, "4": 0.012991350358594706, "3": 0.0002848069430604842, "1": 2.0180717271270122e-05, "2": 0}, "score": 4.986358260939887}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.988725515788299, "4": 0.010363757653982964, "3": 0.0005958330783549861, "1": 0.0003106368540220239, "2": 2.2663793496320665e-06}, "score": 4.987195204150476}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9657659924074843, "4": 0.033096087698659085, "3": 0.00055478012160782, "1": 0.0005468658677299042, "2": 0}, "score": 4.9636055684190685}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9891109387511529, "4": 0.010297068869732875, "3": 0.00030695389524807695, "1": 0.0002801879303819522, "2": 0}, "score": 4.987968213257418}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9650553546082137, "4": 0.031625171785393626, "3": 0.0029149896785270455, "1": 0.00039215240714392827, "2": 8.60813389456336e-06}, "score": 4.960950269430041}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912135484755276, "4": 0.007743475199220214, "1": 0.0005584480281039319, "3": 0.0004791964113627636, "2": 0}, "score": 4.989064281557637}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.985613826786546, "4": 0.013677953170796816, "3": 0.0005175605680309628, "1": 0.000187009245716069, "2": 2.4084528200572796e-06}, "score": 4.984531644143583}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9598371541528664, "4": 0.03665622188937326, "3": 0.0024460336124711114, "1": 0.0010445720489275438, "2": 1.0488302179395266e-05}, "score": 4.95424170474033}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9243877014777314, "4": 0.07061413090848948, "3": 0.002900664587909745, "1": 0.002063652103655893, "2": 0}, "score": 4.915327065244139}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9340033537695983, "4": 0.05856636636434631, "3": 0.005630291848920126, "1": 0.001760224361379816, "2": 2.5410324249733026e-05}, "score": 4.9230548170998265}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9559201925611546, "4": 0.04150439307994109, "3": 0.00201366003465362, "1": 0.0005460756711349914, "2": 0}, "score": 4.9522832360316205}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9555776263504525, "4": 0.04271136221996271, "3": 0.0015754982618572798, "1": 0.00012751953365031332, "2": 0}, "score": 4.953627192434467}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9883709106968847, "4": 0.011271746432288354, "3": 0.0002498069845737895, "1": 0.00010225871851765776, "2": 0}, "score": 4.987819540446166}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9905716423293184, "4": 0.00913859157526344, "3": 0.0002558940669757235, "1": 3.189143753608982e-05, "2": 0}, "score": 4.990222035174493}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9950814195279707, "4": 0.0047437230404930655, "3": 0.00013135223846380214, "1": 4.116583060338919e-05, "2": 0}, "score": 4.9948288970630825}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9955747153553046, "4": 0.004318572375401406, "1": 6.998931292993753e-05, "3": 3.237257319441585e-05, "2": 0}, "score": 4.995336704939371}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989731962241372, "4": 0.0010063480429402445, "3": 1.023144230661192e-05, "1": 9.330312962418681e-06, "2": 0}, "score": 4.998935866869285}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9147148972180479, "4": 0.07926800496829413, "3": 0.005812080399545166, "1": 0.00018914701275593132, "2": 1.1874111878729954e-05}, "score": 4.9083152574471836}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9027427228032119, "4": 0.09132058968441581, "3": 0.005821571712514948, "1": 0.00011031799489477035, "2": 3.2878917633544246e-06}, "score": 4.896584975087974}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9761585324212643, "4": 0.023057010790855162, "3": 0.0006723933812159828, "1": 0.00010720432124700842, "2": 0}, "score": 4.97516926450706}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9813557284020547, "4": 0.018074094662865785, "3": 0.00040392319882221313, "1": 0.0001618055908269833, "2": 0}, "score": 4.980470749707235}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9927489714825208, "4": 0.007032324313468387, "3": 0.0001349727029960887, "1": 8.216718868545357e-05, "2": 0}, "score": 4.992369049588607}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9434865025492739, "4": 0.05230927402591368, "3": 0.003749562921722953, "1": 0.0004264943237631508, "2": 1.4978271106306991e-05}, "score": 4.938439876173007}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9712886519544748, "4": 0.023097455939698516, "3": 0.005146913831250696, "1": 0.0004537807073838, "2": 1.042506036383759e-05}, "score": 4.964762220690189}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9748995899053899, "4": 0.023279365771087458, "3": 0.0017458430793040112, "1": 5.8613881720901514e-05, "2": 0}, "score": 4.972994044585849}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9795677784532164, "4": 0.019293751345040768, "3": 0.001102278696048265, "1": 3.2655280005078705e-05, "2": 0}, "score": 4.978370993657793}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9745104457551254, "4": 0.024881649875147543, "3": 0.0005574942882354847, "1": 4.460850598366147e-05, "2": 0}, "score": 4.973824775666907}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.96202162726951, "4": 0.03272025414532818, "1": 0.0027536664520730982, "3": 0.0024683040095359317, "2": 3.328039743250801e-05}, "score": 4.951228490971679}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9831197679894048, "4": 0.015263185905222375, "1": 0.0008913655012161507, "3": 0.0007213623363248026, "2": 2.856341350916302e-06}, "score": 4.979720028745384}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9879640712767497, "4": 0.011270849236981188, "3": 0.0005299451750874252, "1": 0.00023207591964038334, "2": 2.0004828130763985e-06}, "score": 4.986734941252622}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9917095905688743, "4": 0.007889701322794537, "3": 0.000282068671701372, "1": 0.00011530831696842239, "2": 0}, "score": 4.991084898368659}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9898120256128672, "4": 0.009285441829599754, "3": 0.0006151485958959505, "1": 0.00028331392485671496, "2": 2.514624675356086e-06}, "score": 4.988343443274405}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9838724739233884, "4": 0.015062341358537583, "3": 0.0008964885830726587, "1": 0.00016094723171912852, "2": 0}, "score": 4.982500756948498}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9969649904814294, "4": 0.0029123743577231702, "1": 8.364791969482315e-05, "3": 3.509204820584812e-05, "2": 0}, "score": 4.996682836946096}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.992017914389441, "4": 0.00736219247483034, "3": 0.0004945272016609281, "1": 0.00012262495586466427, "2": 0}, "score": 4.991158229063287}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962859336696998, "4": 0.003653653694041701, "3": 4.053819264305371e-05, "1": 1.7522741611917394e-05, "2": 0}, "score": 4.9961951700063985}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9898908623310807, "4": 0.0097395963956942, "3": 0.0002917214935659525, "1": 7.39292502349639e-05, "2": 0}, "score": 4.9893812023034885}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9943862845199839, "4": 0.005283407656233517, "3": 0.0002979267223056508, "1": 3.0042545429129882e-05, "2": 0}, "score": 4.994000554687399}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.996551648667166, "4": 0.003200641565669581, "3": 0.00013349587226036484, "1": 0.00011202203107348639, "2": 0}, "score": 4.996084269982769}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9884623214423068, "4": 0.010708526346729462, "3": 0.0006487011013282879, "1": 0.00017572751023238678, "2": 0}, "score": 4.987291101377938}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9980989926077944, "4": 0.0018241770958866603, "1": 4.403503459861475e-05, "3": 2.942464410142002e-05, "2": 0}, "score": 4.997940826536831}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9932462024027234, "4": 0.0062007315621293016, "1": 0.00029977840687193475, "3": 0.0002468304239073519, "2": 0}, "score": 4.992106442992257}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9693945496325153, "4": 0.029939835330173043, "3": 0.0006150048524661637, "1": 3.892289188859385e-05, "2": 0}, "score": 4.968674097282339}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9450183100139148, "4": 0.053771806065723834, "3": 0.0011285462262327385, "1": 6.436696643567053e-05, "2": 0}, "score": 4.94371267837926}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9896037039845906, "4": 0.010267065818511696, "3": 8.592660983957858e-05, "1": 3.5062618324964835e-05, "2": 0}, "score": 4.989420743305185}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9920758737371632, "4": 0.007832151736710615, "3": 6.85434299314495e-05, "1": 2.0321675153406022e-05, "2": 0}, "score": 4.991949449670262}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.964537484705654, "4": 0.0347761212048526, "3": 0.0006477256052370354, "1": 2.8484513623686524e-05, "2": 0}, "score": 4.9638141210142495}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8872272453952098, "4": 0.1062037457585669, "3": 0.006507909471911392, "1": 5.1628123752016834e-05, "2": 4.629688364568419e-06}, "score": 4.880559455458683}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8676507214040958, "4": 0.11825762164850484, "3": 0.0136804427848219, "1": 0.0003837089252387551, "2": 1.648984204952321e-05}, "score": 4.8527955660397195}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9812751457223547, "4": 0.018024902589758723, "3": 0.0006275576617154943, "1": 6.533876846965289e-05, "2": 0}, "score": 4.980458489142536}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.888195280227997, "4": 0.1062178824179012, "3": 0.004753160090153817, "1": 0.0007949327802733826, "2": 2.149429514786135e-05}, "score": 4.881029531132237}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8543694136906773, "4": 0.13125742600831108, "3": 0.013013981492925368, "1": 0.0013131689725192888, "2": 3.564766183253622e-05}, "score": 4.837353306756972}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5426432354161633, "3": 0.275618890227989, "5": 0.09973898054912135, "4": 0.06728575021771051, "2": 0.014707853149341194}, "score": 2.166764979154673}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6639131607907822, "4": 0.24301138132742983, "3": 0.08111902974077967, "1": 0.01139218141121262, "2": 0.0005581532453745819}, "score": 4.547504616536468}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9718092904624513, "4": 0.02350812906472188, "3": 0.0037483257701000296, "1": 0.0009283460462686248, "2": 3.9623827860736415e-06}, "score": 4.965269880467328}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912335830862384, "4": 0.00833409622476845, "3": 0.00036124505760552934, "1": 6.956986907138156e-05, "2": 0}, "score": 4.990665120127625}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9704321259656364, "4": 0.027271600308493227, "3": 0.0018321255196215207, "1": 0.00045848728426009364, "2": 2.887570692976347e-06}, "score": 4.967221445896699}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9829590675870186, "4": 0.015273973156212125, "3": 0.0015146867910121769, "1": 0.00023895196726913685, "2": 7.1730615504857646e-06}, "score": 4.980719207680581}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9706474868067103, "4": 0.02406356279032252, "3": 0.004347695258156205, "1": 0.000903344112656282, "2": 2.399094717059053e-05}, "score": 4.963555190086376}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9356641836804407, "4": 0.048324683660160545, "3": 0.012797563215103508, "1": 0.003094241424434595, "2": 8.995419154887474e-05}, "score": 4.913430818768981}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9882989421242451, "4": 0.010666791092464588, "3": 0.0007194870718788639, "1": 0.0003055891515978921, "2": 0}, "score": 4.98667175566336}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9830539807988817, "4": 0.015715135286815226, "3": 0.0010043571438501672, "1": 0.0002110038876028251, "2": 8.340102929525934e-06}, "score": 4.98140698101672}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.986675934797908, "4": 0.012870672569977908, "3": 0.000303946457109401, "1": 0.00014346721726191718, "2": 0}, "score": 4.985947481627343}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9935799592930152, "4": 0.006152338657104048, "1": 0.00015350552470825196, "3": 0.00011154850937687302, "2": 0}, "score": 4.993010523717066}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9927740064453675, "4": 0.006953640107800153, "3": 0.00013591837992488835, "1": 0.00012993788881854565, "2": 0}, "score": 4.9922547212546196}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975302534548467, "4": 0.0023255383926943513, "1": 9.343589236364309e-05, "3": 4.960077992810809e-05, "2": 0}, "score": 4.997201513199622}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982916551850374, "4": 0.0016437247884186384, "1": 3.9299254843264476e-05, "3": 2.4191819963011263e-05, "2": 0}, "score": 4.998150692464503}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8250027824388434, "4": 0.16048105191269826, "3": 0.013730357797508929, "1": 0.0007131259536968833, "2": 6.968900500909301e-05}, "score": 4.808996090008348}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9597391981716923, "4": 0.0360444096283069, "3": 0.0036985256933333406, "1": 0.0005082575757543793, "2": 7.952255172720772e-06}, "score": 4.9545015765403555}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9741676460008283, "4": 0.023704793355598757, "3": 0.0019219543884714371, "1": 0.00019923709704636967, "2": 0}, "score": 4.971654168940194}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9855327766877633, "4": 0.013870787070701173, "3": 0.0003107530539334573, "1": 0.00027779197937529966, "2": 0}, "score": 4.984396415772798}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9908591370355175, "4": 0.008535216132286002, "3": 0.0005390242485682258, "1": 6.18520694815506e-05, "2": 0}, "score": 4.990139280051947}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9572024628289162, "4": 0.037985574870363824, "3": 0.004571937057935908, "1": 0.00023056055927308183, "2": 6.72598617570452e-06}, "score": 4.951927999163485}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9903012828897987, "4": 0.009500257267052031, "3": 0.0001711005778169899, "1": 2.4520084518042032e-05, "2": 0}, "score": 4.990059433016175}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9810949550131013, "4": 0.017836827470774707, "3": 0.0010064305668632, "1": 5.85735106658214e-05, "2": 0}, "score": 4.9799159528139825}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9869768438191628, "4": 0.012667654805576401, "3": 0.0003151052020921903, "1": 3.564085377931602e-05, "2": 0}, "score": 4.986559507461286}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9862242491731806, "4": 0.013113967439823685, "3": 0.0005062849018469546, "1": 0.0001533254149673493, "2": 1.2515922715837086e-06}, "score": 4.985256392733889}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6737799062425449, "4": 0.2928144052051931, "3": 0.028338720328245724, "1": 0.004965948313625319, "2": 9.194490674680396e-05}, "score": 4.63036517172616}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8311797183000915, "4": 0.14805480051535974, "3": 0.019003638844906176, "1": 0.0016797647922191354, "2": 7.966270690958084e-05}, "score": 4.806979408391278}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9293185809991887, "4": 0.06504722723933291, "3": 0.004348128744982402, "1": 0.0012713384955572416, "2": 1.2211456371615558e-05}, "score": 4.921134328724834}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8861795646557002, "4": 0.1017192003240617, "3": 0.008438131340854735, "1": 0.003634164656665831, "2": 2.034445835231889e-05}, "score": 4.866805700245528}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9453415265711641, "4": 0.04589340748540718, "3": 0.006736208832992773, "1": 0.002004705724136022, "2": 1.839646557713169e-05}, "score": 4.932559774442181}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"5": 0.944917185235467, "4": 0.03942892480164107, "3": 0.011321575923951027, "1": 0.004284566066878549, "2": 4.5884003925158514e-05}, "score": 4.920651859168761}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9795192890892175, "4": 0.020038583277499855, "3": 0.0004048256813229671, "1": 3.5496409764201716e-05, "2": 0}, "score": 4.979009741822001}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.990818990218343, "4": 0.008511883781204212, "3": 0.0005667538361037906, "1": 0.00010067560920909693, "2": 0}, "score": 4.989951889062577}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.996774859773987, "4": 0.0029162153978160386, "3": 0.0001656091605851329, "1": 0.0001422251774012734, "2": 5.820450422659843e-07}, "score": 4.9961819174949955}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9758345435414807, "4": 0.022428199626252514, "3": 0.0014604349159275361, "1": 0.0002716511096834822, "2": 4.549350875064491e-06}, "score": 4.973550661613438}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7932036347176364, "4": 0.17065824321344766, "3": 0.03234571578615072, "1": 0.0036668364183861657, "2": 0.0001183005663010815}, "score": 4.749626257800439}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9343273970517715, "4": 0.05320396262372894, "3": 0.010389682838360583, "1": 0.0020528914832288556, "2": 2.2797401449780013e-05}, "score": 4.9177364446755085}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9437055744097556, "4": 0.0479842714450794, "3": 0.00707872126412937, "1": 0.0012114362982276782, "2": 1.8275101469083777e-05}, "score": 4.932957600117103}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9562002111195494, "4": 0.03897204440546421, "3": 0.003936554620653875, "1": 0.0008787603823514554, "2": 8.98395813940226e-06}, "score": 4.949612679339193}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9048493076777473, "4": 0.07566426430091341, "3": 0.012732422321871158, "1": 0.006675369636328782, "2": 7.096881519607131e-05}, "score": 4.871955524315698}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8994753680618657, "4": 0.0866876370449914, "3": 0.012010338000867976, "1": 0.0016847710496304062, "2": 0.00013640734022998653}, "score": 4.882142735052751}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9797122782960597, "4": 0.019020709875117107, "3": 0.0009214597136879739, "1": 0.00033900489878331135, "2": 3.7302362071496403e-06}, "score": 4.977769097769741}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8928992735895065, "4": 0.07763041365756797, "3": 0.025560226193525694, "1": 0.003645032489930723, "2": 0.0002485113597978962}, "score": 4.8559210864606275}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9867382680456055, "4": 0.012400915232776795, "3": 0.00045892856124775166, "1": 0.00039822316250790244, "2": 1.8220779087941398e-06}, "score": 4.98508284126984}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9784391510769186, "4": 0.020441155171578358, "3": 0.0009963872208297233, "1": 0.00011152575580190369, "2": 5.097486412620653e-06}, "score": 4.977104521887233}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9973531766301985, "4": 0.0023907159433743707, "3": 0.00014582474995767023, "1": 0.00010846673737040948, "2": 0}, "score": 4.996883761948331}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9967354139868543, "4": 0.0031760163106987426, "3": 6.288656563370061e-05, "1": 2.472803346033153e-05, "2": 0}, "score": 4.996599295176168}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9950794139433908, "4": 0.004543166695744927, "3": 0.00021741751951033606, "1": 0.0001585269416860419, "2": 0}, "score": 4.994387882221179}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9968366768830512, "4": 0.003044118228159247, "1": 7.609066257754868e-05, "3": 3.906639200902087e-05, "2": 0}, "score": 4.996573372467093}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9866926512031997, "4": 0.012532136673386221, "3": 0.0004875167057053366, "1": 0.00028239521402283657, "2": 3.197171644780942e-06}, "score": 4.985353626742385}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.901446435668273, "4": 0.08345522654322429, "3": 0.012959220972646448, "1": 0.002111088685217602, "2": 2.546631396748806e-05}, "score": 4.882105275804039}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9799454148513982, "4": 0.01931854043295652, "3": 0.0006017416846553861, "1": 0.00012965357138544376, "2": 0}, "score": 4.978959264084139}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9769389852650474, "4": 0.020366416188200863, "1": 0.0013670201240836492, "3": 0.0013161006068854314, "2": 5.621359609043798e-06}, "score": 4.971516271209158}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9811651941151094, "4": 0.018291167242480852, "3": 0.00028752866452534523, "1": 0.0002496529012039152, "2": 0}, "score": 4.980135035554055}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9677170249880246, "4": 0.030665743325671017, "3": 0.001433801887664184, "1": 0.00017668077231165532, "2": 3.680827378279265e-06}, "score": 4.965748782238069}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9574540697570716, "4": 0.03938595493346699, "3": 0.002716042829717622, "1": 0.00041590528662808807, "2": 2.2418837336128167e-05}, "score": 4.9534508206842185}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9951093971329218, "4": 0.004770887178864183, "3": 6.496057568527175e-05, "1": 5.39647231433672e-05, "2": 0}, "score": 4.994883328733029}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9699205985501335, "4": 0.029268231509635236, "3": 0.0006599234595814616, "1": 0.0001476414291329544, "2": 2.795115858944645e-06}, "score": 4.968812945247585}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9852723278968908, "4": 0.013820490074770053, "3": 0.0006287255650808326, "1": 0.00026907914562038893, "2": 0}, "score": 4.98384559072756}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9692318116430002, "4": 0.02994914507210159, "3": 0.0006115768109585905, "1": 0.00019332071740941364, "2": 0}, "score": 4.968053966535533}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"5": 0.990529072437166, "4": 0.00864918311560641, "3": 0.0007067405023266065, "1": 0.0001109212575312044, "2": 0}, "score": 4.9894936079553025}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9983728001276228, "4": 0.0015677763518118447, "3": 4.261731209650407e-05, "1": 1.6102629118822358e-05, "2": 0}, "score": 4.998282577299177}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9939012368180569, "4": 0.005718265807876976, "3": 0.0003239507694042919, "1": 5.437386186461271e-05, "2": 0}, "score": 4.993416322901219}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983766047339387, "4": 0.0015337068438563434, "1": 4.759204178953839e-05, "3": 4.104625321180474e-05, "2": 0}, "score": 4.998193830585855}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995008271282537, "4": 0.0004658017237026261, "1": 2.0262209658741652e-05, "3": 1.2610711324783694e-05, "2": 0}, "score": 4.9994279277299905}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.694223447385872, "4": 0.22170353888342784, "3": 0.07742713332992807, "1": 0.006158136890658283, "2": 0.00048506691862416944}, "score": 4.5973533684176635}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9812695171442616, "4": 0.01764524388831526, "3": 0.0008336511737448511, "1": 0.0002454262655092204, "2": 3.4848205750439727e-06}, "score": 4.979695239890527}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9900178576360227, "4": 0.008870226034079916, "3": 0.0008655639484000348, "1": 0.00024010913711622383, "2": 3.0663795253477914e-06}, "score": 4.988428973622492}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9902180456235089, "4": 0.009105323832391004, "3": 0.00045377730404125695, "1": 0.00021673199799192316, "2": 0}, "score": 4.9891201269692225}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9697425452326869, "4": 0.02863458574435492, "3": 0.0012720099395285055, "1": 0.0003393975241417423, "2": 6.6172346623974834e-06}, "score": 4.967443794863208}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9502532433159531, "4": 0.04484781991589518, "3": 0.004453627706354766, "1": 0.00042722113424272754, "2": 1.2731605932166166e-05}, "score": 4.944497548027644}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9898183356846438, "4": 0.009992239872418531, "3": 0.0001282609111935153, "1": 5.959338380727977e-05, "2": 0}, "score": 4.989512848303586}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9870353693332412, "4": 0.012470355640619973, "3": 0.0004546948606155605, "1": 3.739649778652517e-05, "2": 0}, "score": 4.9864706391033735}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9916516744365913, "4": 0.007921600581105751, "3": 0.00025278935625490465, "1": 0.00017250436801282022, "2": 0}, "score": 4.990882790185253}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.989784110337958, "4": 0.00970148803081035, "3": 0.0003892362781089959, "1": 0.00012291506125990695, "2": 1.630116619498945e-06}, "score": 4.989023482010707}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9922692640449889, "4": 0.007444356875418945, "3": 0.0002461410038151381, "1": 3.833788447046301e-05, "2": 0}, "score": 4.991909994206511}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9974473369992934, "4": 0.0023757495292994683, "3": 9.394068363819552e-05, "1": 8.199067800731711e-05, "2": 0}, "score": 4.997108403551529}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9970125084607033, "4": 0.0027110507191247016, "3": 0.00019246697064944314, "1": 8.243281170550697e-05, "2": 0}, "score": 4.996574278813589}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995035673634777, "4": 0.0003624454781807986, "1": 0.0001198637352474978, "3": 1.32795141456921e-05, "2": 0}, "score": 4.999131539819637}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9962067816973741, "4": 0.00339799950977872, "3": 0.00020424485791251343, "1": 0.00018497830685587177, "2": 0}, "score": 4.995453570288271}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9725397084617259, "4": 0.025502211629755217, "3": 0.0017731187096749611, "1": 0.00017927636575722471, "2": 5.205712383691509e-06}, "score": 4.970218814081932}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9889551442887087, "4": 0.009762118916695019, "3": 0.0008471853975130666, "1": 0.00043194784766735684, "2": 3.1763081332505927e-06}, "score": 4.986806184336267}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9649401242282866, "4": 0.028520464407376975, "3": 0.005833343172546171, "1": 0.0006764297223047218, "2": 2.589783975189765e-05}, "score": 4.957029276101488}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964384768226612, "4": 0.0034879922320073388, "3": 4.6320404129845416e-05, "1": 2.6501081883844363e-05, "2": 0}, "score": 4.996313360016677}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9813331093945444, "4": 0.01688490080335806, "3": 0.0014638094924768427, "1": 0.0003099552889750012, "2": 7.292646837457361e-06}, "score": 4.978925761466209}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9923877081744846, "4": 0.006853718001602078, "3": 0.0005825920845232986, "1": 0.0001736291248389823, "2": 1.249763780635228e-06}, "score": 4.991282822424908}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9940377368583247, "4": 0.0057178295208403975, "3": 0.0001695894570769633, "1": 7.407814562496988e-05, "2": 0}, "score": 4.993646674115743}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9957990282729978, "4": 0.004015666270583536, "3": 0.0001337448068809855, "1": 5.0683659355380274e-05, "2": 0}, "score": 4.995514105544148}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9968644059755053, "4": 0.0030840827241082327, "3": 3.6219786502165485e-05, "1": 1.3693668297889807e-05, "2": 0}, "score": 4.996788697898532}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955838171400724, "4": 0.004094913439482618, "3": 0.00017942684174394467, "1": 0.00014033979063254217, "2": 0}, "score": 4.994984866177815}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9113871221478375, "4": 0.0699974266325972, "3": 0.018049577530312753, "1": 0.0005171761633529378, "2": 4.0694931762081784e-05}, "score": 4.891711762271263}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9811755160272446, "4": 0.01820976300281036, "3": 0.000520267737024598, "1": 8.650909543644409e-05, "2": 0}, "score": 4.980403509464179}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8265822257323655, "4": 0.15793269779912245, "3": 0.014684261573525158, "1": 0.0007466987753552229, "2": 3.4967272687265135e-05}, "score": 4.809603436259687}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9621135403201931, "4": 0.035637957044721745, "3": 0.0021060403624461417, "1": 0.00013251297404643522, "2": 0}, "score": 4.959619508576633}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9770998720310188, "4": 0.02218726507436925, "3": 0.0005855851232067072, "1": 0.00012001413865472512, "2": 0}, "score": 4.976161334969291}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"5": 0.955045348775517, "4": 0.0387769919197919, "3": 0.005480974310164628, "1": 0.0006689131010966144, "2": 2.5076284477613417e-05}, "score": 4.9475100367096445}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9886914849360743, "4": 0.009519156852642038, "3": 0.0012242945235768246, "1": 0.0005573502503219047, "2": 6.1464062287218e-06}, "score": 4.985784391603928}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9914637930862026, "4": 0.007612733295839621, "3": 0.0008217580905136674, "1": 9.919588761764874e-05, "2": 0}, "score": 4.990346942650436}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9959422031969566, "4": 0.003810025488389095, "3": 0.00016467594250977024, "1": 8.185959781462334e-05, "2": 7.187508947256055e-07}, "score": 4.995531025672086}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9958634601478057, "4": 0.003701889181662427, "3": 0.0002907199864281478, "1": 0.00014212309637537287, "2": 1.1229695471324574e-06}, "score": 4.995144806227383}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9773724358966623, "4": 0.02211603871423454, "3": 0.0004670186805115516, "1": 4.3009781129919625e-05, "2": 7.377690512552406e-07}, "score": 4.976775653862111}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9268206552878506, "4": 0.06696409491675594, "3": 0.006134780375957378, "1": 7.470556280428188e-05, "2": 4.469808461648221e-06}, "score": 4.920454009718384}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9846914077701734, "4": 0.01489561506920648, "3": 0.00029623677732889484, "1": 0.00011418358615646314, "2": 0}, "score": 4.984055136263728}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9499736610333067, "4": 0.04865500003445673, "3": 0.001212973252456438, "1": 0.00015319299902074378, "2": 2.4718368987886495e-06}, "score": 4.948298726316783}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9659396933139819, "4": 0.03299519282818554, "3": 0.0006404855483229439, "1": 0.00042008562433530345, "2": 0}, "score": 4.964043330237996}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9484749453307201, "4": 0.048430495081450274, "3": 0.0026320546554136535, "1": 0.00044631882815579775, "2": 1.0587526447460886e-05}, "score": 4.944488046927768}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9526974413078966, "4": 0.04410444976142272, "3": 0.0026459203917612623, "1": 0.0005455516900418682, "2": 3.967057190398306e-06}, "score": 4.948409463787332}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9222807783066327, "4": 0.07405543830345714, "3": 0.0033358225111258196, "1": 0.00031460426831414923, "2": 9.905246417810443e-06}, "score": 4.917984500796434}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9581301023703594, "4": 0.040322506176316206, "3": 0.001203085707166421, "1": 0.00033441460582541186, "2": 5.503540200368822e-06}, "score": 4.955916959946697}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9823904065073303, "4": 0.01714486272168765, "3": 0.00043994686487146685, "1": 2.156959227829191e-05, "2": 0}, "score": 4.981888906964719}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9834891728585957, "4": 0.016182044752944266, "3": 0.00029311632912836676, "1": 3.263337566192426e-05, "2": 0}, "score": 4.983101137837249}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9775743731040533, "4": 0.021231670936111027, "3": 0.0010747562363494208, "1": 0.00011566065986927016, "2": 2.115843514823337e-06}, "score": 4.976149792477073}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9890596240176809, "4": 0.009852345798695834, "3": 0.000893866877927269, "1": 0.0001901127957707533, "2": 1.9397615593390135e-06}, "score": 4.98759362379095}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9878834418794014, "4": 0.011563959003704091, "3": 0.0004776749871212778, "1": 6.983592470578079e-05, "2": 0}, "score": 4.98720128220073}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9964384768226612, "4": 0.003446303746846131, "3": 6.491089984830283e-05, "1": 4.805136572283868e-05, "2": 0}, "score": 4.996231660484802}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9707774506453916, "4": 0.02580868540762367, "3": 0.003076552583322013, "1": 0.00032743565351829265, "2": 8.037543952389487e-06}, "score": 4.9667042929767575}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9610985190929916, "4": 0.034224004334199074, "3": 0.0040721974957057105, "1": 0.0005903643909077955, "2": 1.2525675253393283e-05}, "score": 4.955232459134854}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9634793920419457, "4": 0.032549010831192375, "3": 0.0036217679079411204, "1": 0.0003332798601729429, "2": 9.54383654292143e-06}, "score": 4.95884541409324}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9865975011254183, "4": 0.012109173174589075, "3": 0.0008602435595789789, "1": 0.0004273988097265188, "2": 3.843542848181132e-06}, "score": 4.984449185228603}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8921202286525085, "4": 0.09596199992422148, "3": 0.010302836843181756, "1": 0.0015552701788295684, "2": 3.781990525095717e-05}, "score": 4.877095101162771}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9962381233538392, "4": 0.0037122927549277456, "3": 4.845693948787591e-05, "1": 8.826694987580711e-07, "2": 7.010960736599682e-08}, "score": 4.996187051695168}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9991037086092983, "4": 0.0008469570271156105, "3": 4.713998399391219e-05, "1": 1.901086486931946e-06, "2": 7.611488449064245e-08}, "score": 4.9990509301081785}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9896462004592824, "4": 0.01010920989342746, "3": 0.00022490577977914288, "1": 1.864232546094139e-05, "2": 0}, "score": 4.989366398169826}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995148678646674, "4": 0.0004828309333790263, "3": 1.8079227928062165e-06, "1": 3.622515416471307e-07, "2": 0}, "score": 4.9995121041509405}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9972768202990548, "4": 0.0026419328224083233, "1": 6.583032233636307e-05, "3": 1.526916687219257e-05, "2": 0}, "score": 4.997064207121797}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9141203575283564, "4": 0.07188734773828577, "3": 0.012746392354558298, "1": 0.0011878401749053527, "2": 4.80816957027121e-05}, "score": 4.897723240991836}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9912687249221465, "4": 0.008133442608256273, "3": 0.00032064755420957653, "1": 0.0002737536345573157, "2": 0}, "score": 4.990130213879087}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.981307627448539, "4": 0.016120879239464387, "3": 0.0022664977053588704, "1": 0.0002893223770580227, "2": 0}, "score": 4.978188493984844}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9791655271110407, "4": 0.019682158765598503, "3": 0.0008976293728211716, "1": 0.00024587556090422557, "2": 0}, "score": 4.977538882380898}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.924826432145737, "4": 0.06550240627452956, "3": 0.008784433889499958, "1": 0.0008255418494564393, "2": 3.7069945907555984e-05}, "score": 4.913513263005865}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8403931507774002, "4": 0.10718978757950531, "3": 0.05098367987094688, "1": 0.0012914372932931128, "2": 0.0001208533174765}, "score": 4.78531001549189}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9833574010223058, "4": 0.01505965447651622, "3": 0.001533140090549317, "1": 4.174599664531493e-05, "2": 0}, "score": 4.981706933942705}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9722114898879699, "4": 0.02677864332526351, "3": 0.0009226213001649704, "1": 8.213560147443441e-05, "2": 0}, "score": 4.97104742372417}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9961523618020344, "4": 0.0036801785829617697, "3": 0.00014353222263394197, "1": 2.202436978879465e-05, "2": 0}, "score": 4.995944651775196}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.974097054525965, "4": 0.024206192260930067, "3": 0.0014726864927994403, "1": 0.00021043136816007054, "2": 0}, "score": 4.972006327577249}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8415029918334176, "4": 0.10632680093134934, "3": 0.05075691571996816, "1": 0.0012734716821890997, "2": 0.00011854084182719632}, "score": 4.78670531967884}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.917733706966545, "4": 0.07470031275785413, "3": 0.007283833322985625, "1": 0.0002516276858606713, "2": 1.7209740952569256e-05}, "score": 4.909672678416056}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.975121379439424, "4": 0.02417122506977286, "3": 0.0006128990607146689, "1": 8.64956875657883e-05, "2": 0}, "score": 4.974256788093724}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9613147261813296, "4": 0.034080714904374684, "3": 0.00430771533542135, "1": 0.00026626433553636106, "2": 1.6172472329333388e-05}, "score": 4.956189648499947}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9757783614849928, "4": 0.023508575723417354, "3": 0.0006184788885627853, "1": 8.628394623057206e-05, "2": 0}, "score": 4.974909122461335}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9998347339779339, "4": 0.0001599594839675781, "3": 3.136895316153461e-06, "1": 1.8302435729413665e-06, "2": 1.0089202009288429e-07}, "score": 4.999826143033582}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999040904456155, "4": 9.537309903874661e-05, "3": 2.68873453800717e-07, "1": 5.616775495255142e-08, "2": 0}, "score": 4.999903864462709}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997428656846962, "4": 0.00025369038276007726, "3": 2.798127820374821e-06, "1": 5.733755068803952e-07, "2": 0}, "score": 4.999738419840626}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998561836525626, "4": 0.00014309010803952005, "3": 4.1526996921025113e-07, "1": 2.5729604215402717e-07, "2": 0}, "score": 4.999855050160073}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996936631107295, "4": 0.0002915058452672464, "1": 1.046565096486942e-05, "3": 4.153035688193264e-06, "2": 0}, "score": 4.99965832540694}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9377818324829107, "4": 0.05238534512279994, "3": 0.0082188473895107, "1": 0.0015185487043581128, "2": 7.66904782547111e-05}, "score": 4.924871286247761}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9698686849394464, "4": 0.0267584330798806, "3": 0.002077686425003977, "1": 0.0012838336990196545, "2": 9.782123213352396e-06}, "score": 4.963921455909911}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9700621396904643, "4": 0.027149278704731043, "3": 0.0021023790384910785, "1": 0.0006741487999359951, "2": 9.611617835343042e-06}, "score": 4.965920449937713}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9421326376673408, "4": 0.05049838618217832, "3": 0.005817765649333284, "1": 0.0015209465616760408, "2": 2.406516978420835e-05}, "score": 4.931709677447118}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9948426746050669, "4": 0.0048456978932417735, "3": 0.0001956829129191336, "1": 0.00011509047497555426, "2": 0}, "score": 4.994302569514764}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9773724358966623, "4": 0.02211603871423454, "3": 0.0004670186805115516, "1": 4.3009781129919625e-05, "2": 7.377690512552406e-07}, "score": 4.976775653862111}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9943241724189643, "4": 0.005539659733805095, "3": 0.00012779092856943014, "1": 7.658204508925116e-06, "2": 0}, "score": 4.99417412140388}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9017705774470167, "4": 0.092077386306564, "3": 0.00590019427881433, "1": 0.00023883299881504052, "2": 1.1684586241165455e-05}, "score": 4.895131700496078}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9531145053760273, "4": 0.04484605743120554, "3": 0.0017419754389344307, "1": 0.00029092443443366067, "2": 3.152950111741137e-06}, "score": 4.950496667565298}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9691657462082603, "4": 0.029296931365404736, "3": 0.0010394183511742946, "1": 0.0004922223562353086, "2": 4.308895289687708e-06}, "score": 4.9666423700272935}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9975888500031425, "4": 0.002378738437766226, "1": 2.0173816646037525e-05, "3": 1.198196446506574e-05, "2": 0}, "score": 4.997516601731522}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9969425954099026, "4": 0.0029883693746232034, "3": 4.2141270522800804e-05, "1": 2.6129620554176787e-05, "2": 0}, "score": 4.996822827173723}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998557069012507, "4": 0.00013992709793739735, "1": 3.5222203005590903e-06, "3": 7.668485597417352e-07, "2": 0}, "score": 4.999844450311774}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993871131918947, "4": 0.0006103203955987496, "1": 1.757878278011009e-06, "3": 6.77466318377718e-07, "2": 0}, "score": 4.99938129307756}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994834394633573, "4": 0.0005075687440325112, "3": 6.737679366287715e-06, "1": 2.074220785228373e-06, "2": 0}, "score": 4.999470658918869}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7741761092058627, "4": 0.18961691101909506, "3": 0.03469874360616341, "1": 0.0013804648344110026, "2": 0.00010655055399960372}, "score": 4.735138470200558}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.981279508481351, "4": 0.018194680642670966, "3": 0.00039972809679860637, "1": 0.00011817145259159639, "2": 0}, "score": 4.980533023343757}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.963200594706429, "4": 0.035665091418504574, "3": 0.000995550905656459, "1": 0.00013182200398765187, "2": 0}, "score": 4.961816253722169}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9491123951804843, "4": 0.04688704817425907, "3": 0.003304493731547117, "1": 0.0006670274890028849, "2": 1.5231498569522917e-05}, "score": 4.943789383983736}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9876488513717451, "4": 0.012050677458540805, "3": 0.0002473072666307051, "1": 4.514468516911493e-05, "2": 0}, "score": 4.987274027215173}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9002008399979908, "4": 0.09048241106845208, "3": 0.008741617830327354, "1": 0.0005340473780498138, "2": 3.5655505180876084e-05}, "score": 4.889790599002276}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.775259040244183, "4": 0.13344215378858112, "3": 0.08420410550127733, "1": 0.006784543287814444, "2": 0.00029816396638722355}, "score": 4.670113013753962}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9956562435191468, "4": 0.003796652202119975, "3": 0.0003263781106769919, "1": 0.0002190685200813086, "2": 1.1116157171102875e-06}, "score": 4.994670979739231}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9790938655877265, "4": 0.018749694875589917, "3": 0.0018272484917953669, "1": 0.0003175815252979496, "2": 6.833913921331314e-06}, "score": 4.976304867139253}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9130890477597565, "4": 0.0784094204533908, "3": 0.007147628182754799, "1": 0.0012975859530410484, "2": 4.9315259573061536e-05}, "score": 4.901956347050175}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9894810225016376, "4": 0.009454353081454429, "3": 0.0005568002499721109, "1": 0.0005024260967456506, "2": 4.304610071124245e-06}, "score": 4.987409414434102}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9957582443665515, "4": 0.003802330921150888, "1": 0.00027138963558484227, "3": 0.00016582276843380943, "2": 1.1945703225005917e-06}, "score": 4.994776875972902}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9915288283036867, "4": 0.008121700707524389, "3": 0.0003167039918448698, "1": 3.0944446794153826e-05, "2": 0}, "score": 4.991121097339363}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9980517213635156, "4": 0.001874148230202977, "1": 4.88018175949805e-05, "3": 2.4491461778258982e-05, "2": 0}, "score": 4.997881659802541}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.989089597923764, "4": 0.010139238320114414, "1": 0.0005178261447169587, "3": 0.00024912170644759795, "2": 0}, "score": 4.98729116010886}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.992558799844341, "4": 0.0066982887209011705, "3": 0.0005704213270068268, "1": 0.0001701622779594688, "2": 1.2247908049745938e-06}, "score": 4.991476535739119}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9901073632561964, "4": 0.00939875542563713, "3": 0.0003881912218216892, "1": 0.00010266749453897554, "2": 0}, "score": 4.989414160155785}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.996022377380924, "4": 0.003808181882241392, "3": 0.00011937819441786834, "1": 4.9006334142195085e-05, "2": 0}, "score": 4.995757031910896}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964902017918065, "4": 0.0033239890374292974, "3": 0.0001133004973801963, "1": 7.173900180655074e-05, "2": 0}, "score": 4.996162451006931}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9929036187722208, "4": 0.006853464418727332, "3": 0.00015940921224853345, "1": 8.143959322141417e-05, "2": 0}, "score": 4.992501943277881}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.977685236323789, "4": 0.021391154147576776, "3": 0.0007263230279623209, "1": 0.0001927269765242971, "2": 2.5933087186766174e-06}, "score": 4.976377465517254}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.881144031525804, "4": 0.11121566886864452, "3": 0.0073624096627118475, "1": 0.00023402420682192463, "2": 3.040416355147553e-05}, "score": 4.873030493278773}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.984710831492108, "4": 0.013474517094124044, "3": 0.0017242581137410572, "1": 8.830092277111167e-05, "2": 1.3567275107023232e-06}, "score": 4.982719680092513}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9945496901291663, "4": 0.005026180134368037, "3": 0.00023744750274415507, "1": 0.000182714633865862, "2": 0}, "score": 4.993768041598763}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9386358698680304, "4": 0.058302109660147206, "3": 0.002701713709746044, "1": 0.0003357151249612274, "2": 1.835668031224665e-05}, "score": 4.934896126459739}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8919959471199053, "4": 0.0834132424373147, "3": 0.021437475433839115, "1": 0.0029308417808402527, "2": 0.00019931760509510717}, "score": 4.861387274320087}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9762179412849643, "4": 0.020974815979347732, "3": 0.0021192824808826598, "1": 0.0006671086044772685, "2": 1.0164411574167388e-05}, "score": 4.972087393097561}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9183521006431656, "4": 0.0695414500911833, "3": 0.009203474529270743, "1": 0.0028321577557163854, "2": 6.032873703553484e-05}, "score": 4.900540940465456}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9735339613052503, "4": 0.024213227602586727, "3": 0.0015473244513529332, "1": 0.0006856275552844199, "2": 1.0811966802346363e-05}, "score": 4.969916905207834}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9847109496574149, "4": 0.014424674959193678, "3": 0.0006764808623247968, "1": 0.00018201635723652981, "2": 0}, "score": 4.9834942008634195}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8886571641262413, "4": 0.10520382710659323, "3": 0.005658185619974142, "1": 0.00044534245943611447, "2": 2.722241073011524e-05}, "score": 4.881615786933897}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9372391967246547, "4": 0.06035280823765446, "3": 0.002141149595557013, "1": 0.0002546437623313587, "2": 5.864308415690115e-06}, "score": 4.93432830841076}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9843208549265534, "4": 0.01484755609506352, "3": 0.0007663065288945526, "1": 6.315276029426954e-05, "2": 1.621579311448834e-06}, "score": 4.98336234661428}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970548134962627, "4": 0.0028825931230334043, "3": 4.928232798004341e-05, "1": 1.2811402029451738e-05, "2": 0}, "score": 4.996967595097746}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9533087174751252, "4": 0.04491529034501637, "3": 0.0015804546818804668, "1": 0.00018350695303290658, "2": 6.580663380523988e-06}, "score": 4.951169764369948}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9915650445555357, "4": 0.008202563923389847, "3": 0.00021943093980237907, "1": 8.406713038771664e-06, "2": 0}, "score": 4.991324907839624}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9972735063536872, "4": 0.0026827810963567637, "3": 2.6807013685589113e-05, "1": 1.3263933143922689e-05, "2": 0}, "score": 4.997210538985587}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9770093010250217, "4": 0.021554686825003503, "3": 0.0012312796309762975, "1": 0.0001799310204938543, "2": 0}, "score": 4.9752624163019235}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960469785410372, "4": 0.003849038123304152, "1": 5.1061743532234125e-05, "3": 5.08109335081175e-05, "2": 0}, "score": 4.995845084265942}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9933546433937046, "4": 0.0065382979478954065, "3": 0.000100170181842833, "1": 4.7251511883315105e-06, "2": 0}, "score": 4.993242446464879}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9787240934931006, "4": 0.01992695382783328, "3": 0.0011423488974543264, "1": 0.0002018214827624339, "2": 0}, "score": 4.976980952362243}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.980700398736875, "4": 0.018038751032068825, "3": 0.0011405147310666625, "1": 0.00011452401717259512, "2": 0}, "score": 4.979222002686132}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9233146992409493, "4": 0.07118128117323827, "3": 0.005306316901115611, "1": 0.00018558714534599657, "2": 7.507687968298189e-06}, "score": 4.91744083295887}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9919131638205743, "4": 0.007670081790270882, "3": 0.0002438417764944988, "1": 0.00017108141562537722, "2": 9.848544235963767e-07}, "score": 4.991154946945022}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9752823569866462, "4": 0.023741198658126354, "3": 0.0008856134404722463, "1": 8.458082262230818e-05, "2": 0}, "score": 4.974149089599868}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9866476205648759, "4": 0.012274590086921064, "3": 0.0009285586618567761, "1": 0.00014131614702961586, "2": 0}, "score": 4.985302911680563}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9987104769503095, "4": 0.001249797925920243, "3": 2.6028486112096606e-05, "1": 1.2660065088370084e-05, "2": 0}, "score": 4.99864750343954}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9958016289051359, "4": 0.0040638507267625225, "1": 6.777053801571306e-05, "3": 6.255539961480903e-05, "2": 0}, "score": 4.995539937614523}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994187804335692, "4": 0.0005537581050792944, "1": 1.6574387099197688e-05, "3": 1.0528275662247325e-05, "2": 0}, "score": 4.999358887565169}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99391183414771, "4": 0.005912721871695516, "3": 0.0001354115362310398, "1": 3.6590862763335757e-05, "2": 0}, "score": 4.993670069819818}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8373028717528117, "4": 0.12456118973509027, "3": 0.037023279074612496, "1": 0.0009024959096601762, "2": 0.00018623858335615226}, "score": 4.797218701195662}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8979110221990315, "4": 0.08976090992037973, "3": 0.009906719645687144, "1": 0.0023183420091900725, "2": 8.030111914982692e-05}, "score": 4.880908675412821}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9696651570471838, "4": 0.028108032202010084, "3": 0.0018070438516733672, "1": 0.00039962286224545605, "2": 9.9263174464872e-06}, "score": 4.9666492689249075}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9781250589355729, "4": 0.02062580123001621, "3": 0.0010331540202575746, "1": 0.00020612557242733986, "2": 5.14355542858515e-06}, "score": 4.976467846779689}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8353114914851422, "4": 0.12965095513473937, "3": 0.02953919362450912, "1": 0.005125911070003784, "2": 0.0003636383966095437}, "score": 4.789674245115714}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8644671443152884, "4": 0.13029662460284955, "3": 0.004724478946454068, "1": 0.0004887909328963443, "2": 0}, "score": 4.858296000078418}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9387417539659023, "4": 0.057745006549154515, "3": 0.003193685819084047, "1": 0.00030297326217362754, "2": 1.3406579018025985e-05}, "score": 4.934615301507361}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9220026179540676, "4": 0.07368163475888027, "3": 0.003913856789392355, "1": 0.00038437550714605156, "2": 1.3697092142927068e-05}, "score": 4.916911741134793}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969761287362183, "4": 0.0028753323828190095, "1": 8.18145056002734e-05, "3": 6.150402119529361e-05, "2": 0}, "score": 4.996674384191496}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.937638958238798, "4": 0.05880083050162531, "3": 0.003244076373511798, "1": 0.00029991543691285495, "2": 1.2486243995364474e-05}, "score": 4.933473647915194}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9972090067837173, "4": 0.002297170800416957, "1": 0.000282602850802312, "3": 0.00020778493074478599, "2": 0}, "score": 4.996156834735017}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9972240630581262, "4": 0.0025264818932263173, "3": 0.00012979256964220054, "1": 0.00011856656798105947, "2": 0}, "score": 4.996739663122526}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9626602992614537, "4": 0.03572677040217863, "3": 0.001496893976551012, "1": 0.00010928100124344212, "2": 0}, "score": 4.960842053113773}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984902092824791, "4": 0.001426811135474858, "1": 5.647000193576504e-05, "3": 2.4403719469692993e-05, "2": 0}, "score": 4.998298497834717}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9952756301092405, "4": 0.004573399854562587, "1": 7.96279019121072e-05, "3": 6.704500149058923e-05, "2": 0}, "score": 4.994973976937319}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9882583139898513, "4": 0.011420553595111382, "3": 0.00023049163197100432, "1": 8.803271950802914e-05, "2": 0}, "score": 4.987766300356648}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9765704850104928, "4": 0.021702908394940105, "3": 0.0014824235451359898, "1": 0.00023512788508211715, "2": 4.045796973652993e-06}, "score": 4.974379467240879}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9644579647617879, "4": 0.03217294812089026, "3": 0.0030897410319964277, "1": 0.00026739569310215057, "2": 8.670448832997017e-06}, "score": 4.960551846308498}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9931545969476053, "4": 0.006134909207698004, "1": 0.000512257310292649, "3": 0.00019648076882882422, "2": 1.1304994858808088e-06}, "score": 4.991419703150046}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987827666302617, "4": 0.001077680750684088, "1": 0.00010954216657022264, "3": 2.9577281743067216e-05, "2": 0}, "score": 4.998424995337303}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9079693740223103, "4": 0.07293229747602598, "3": 0.017439683650011965, "1": 0.0015799024094843733, "2": 6.186054379554686e-05}, "score": 4.8856812140365}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9643662742440073, "4": 0.03223364165279773, "3": 0.0024125005422121694, "1": 0.0009726025871141781, "2": 1.2051468960762598e-05}, "score": 4.959014672440721}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9412681398205803, "4": 0.05343846360892614, "3": 0.004080768297838899, "1": 0.0011776766760199864, "2": 2.4841423395111595e-05}, "score": 4.9336140976481575}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9696315306122716, "4": 0.02945959251055607, "3": 0.0007105009310590782, "1": 0.00019400201739727292, "2": 2.818662715080423e-06}, "score": 4.968334892321926}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9724599897316405, "4": 0.026474944071480384, "3": 0.0008922885421011686, "1": 0.0001674380710732651, "2": 2.907223662682353e-06}, "score": 4.971061934501241}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9080574331621217, "4": 0.074820916555263, "3": 0.015961804969946532, "1": 0.0010766025319911409, "2": 7.745170322953099e-05}, "score": 4.888716063813297}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9976174435040533, "4": 0.002251843646150957, "3": 9.176019133293577e-05, "1": 3.772958587734199e-05, "2": 0}, "score": 4.997413714464458}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9907130892179904, "4": 0.008506437918446212, "3": 0.0005658454916376925, "1": 0.0002039354572928445, "2": 0}, "score": 4.989546017496019}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9925380104217221, "4": 0.0069277416439154135, "1": 0.0003271934407644609, "3": 0.00019768019694550333, "2": 0}, "score": 4.9913680432806125}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9891553785256967, "4": 0.010553903368004254, "3": 0.000190680748921511, "1": 9.413920188364218e-05, "2": 0}, "score": 4.988688111607341}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7168862486444901, "4": 0.23073707965374668, "3": 0.049820317311968974, "1": 0.0021494426564639614, "2": 0.0003964815698749837}, "score": 4.659831522374011}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9660735055139253, "4": 0.030788568823100885, "3": 0.0018966775147054634, "1": 0.0012249585160596032, "2": 1.3436724034681942e-05}, "score": 4.960477819157993}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9099858946281503, "4": 0.08538891393684413, "3": 0.0031519341459094103, "1": 0.0014549045236445727, "2": 1.0590999725722147e-05}, "score": 4.902455069556683}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.983942055845132, "4": 0.015107809249589342, "1": 0.0005522202983992181, "3": 0.000392825721969048, "2": 3.223054646850401e-06}, "score": 4.981887955154934}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9823336937638297, "4": 0.01630269903349645, "1": 0.0007947738096149241, "3": 0.0005636671163227998, "2": 3.3748522917666096e-06}, "score": 4.979380710000623}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9773507902690183, "4": 0.020770108857810055, "3": 0.0014091959295277213, "1": 0.00045660019353843434, "2": 7.936628460705736e-06}, "score": 4.974561152064769}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9825166301702859, "4": 0.01574199180254263, "3": 0.0012329507485519997, "1": 0.0004983584304344023, "2": 7.629784170708778e-06}, "score": 4.979775734297824}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9796944320197426, "4": 0.018267336585136115, "3": 0.001907388976822895, "1": 0.00012429037451204422, "2": 3.700021231823068e-06}, "score": 4.977409559471029}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9790134187081038, "4": 0.019793046298722222, "3": 0.0010178446252076137, "1": 0.0001669642233392271, "2": 4.186451835858567e-06}, "score": 4.977490746016901}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970235283014568, "4": 0.002860077947932273, "1": 7.817731828432111e-05, "3": 3.718281000962973e-05, "2": 0}, "score": 4.996752843802578}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9219432336779363, "4": 0.05997691144908533, "3": 0.012021344510688682, "1": 0.005922959733730804, "2": 0.00011681208797365986}, "score": 4.891936099370904}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9811214684814139, "4": 0.01760025831600498, "3": 0.0010936407620252865, "1": 0.00017860569555942066, "2": 3.928682225068668e-06}, "score": 4.979486208291808}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9141385834417384, "4": 0.06201101800298399, "3": 0.02296515986461502, "1": 0.000814464268605386, "2": 5.6819839855228046e-05}, "score": 4.8886287915351145}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9829143793518305, "4": 0.015097928952975667, "3": 0.001555638199288983, "1": 0.0004130383963310685, "2": 0}, "score": 4.980138263390224}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9857934658542206, "4": 0.0133620363644499, "3": 0.0006170234674606113, "1": 0.00022396920348568324, "2": 1.9020505821583103e-06}, "score": 4.984502308891213}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8873556222687984, "4": 0.09829116832155331, "3": 0.013895947890699867, "1": 0.00041697095119283957, "2": 2.0999414533219257e-05}, "score": 4.87218358812269}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9616155676618817, "4": 0.036718252655375566, "3": 0.0014530034790586348, "1": 0.0001882951272923572, "2": 0}, "score": 4.959621555218169}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9386889136797754, "4": 0.056867589767595206, "3": 0.003912821319884538, "1": 0.00048651442802248156, "2": 0}, "score": 4.933357766905904}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9774245908587224, "4": 0.021006850083419692, "3": 0.0013508017147780135, "1": 0.00020793604531292717, "2": 0}, "score": 4.975459561286817}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9443946535502576, "4": 0.05369533246285499, "3": 0.001703863430852864, "1": 0.00019095839134707508, "2": 0}, "score": 4.942132227973328}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9735401714981968, "4": 0.023529171199591453, "3": 0.001780601589764377, "1": 0.0011260196480434043, "2": 1.9240762163957576e-05}, "score": 4.96834767295974}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9922081282499838, "4": 0.007229268670517126, "3": 0.00037797500079299513, "1": 0.00017722995283861155, "2": 0}, "score": 4.991305797195736}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9882721655154515, "4": 0.010742920494549727, "3": 0.0005063005969221842, "1": 0.00047257537497331014, "2": 3.748971583476859e-06}, "score": 4.986342898635222}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9797515283155647, "4": 0.018329828012809364, "1": 0.0009755153134227248, "3": 0.0009296526836600433, "2": 1.0120980615849325e-05}, "score": 4.975878361503617}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.923112709315396, "4": 0.07432086096328437, "3": 0.0015654968959262542, "1": 0.0009721839718138337, "2": 0}, "score": 4.918657070841648}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7065493343972755, "4": 0.25753501179120214, "3": 0.03491272161515815, "1": 0.0009080995035132529, "2": 8.328667379839604e-05}, "score": 4.668753462364199}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9198738480737985, "4": 0.06980776702323123, "3": 0.007811326368785091, "1": 0.0024373385333856415, "2": 5.8153179670756575e-05}, "score": 4.904644663608524}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9638484801432768, "4": 0.034585443276350554, "3": 0.001231384171054631, "1": 0.00032425996590158243, "2": 7.830415376556372e-06}, "score": 4.961631157434998}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9759084560488399, "4": 0.02318179515352333, "3": 0.0007899443958344754, "1": 0.00010733798108406828, "2": 0}, "score": 4.974808650084504}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9499564476665223, "4": 0.04547206034445099, "3": 0.0035869572447643668, "1": 0.000935813456462942, "2": 4.236254325345225e-05}, "score": 4.943483324335304}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9986321286899651, "4": 0.0012527471739550797, "3": 5.949596873862483e-05, "1": 5.374375950120812e-05, "2": 0}, "score": 4.9984132828605405}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9939554018363407, "4": 0.005476326771189671, "3": 0.00031019575252929315, "1": 0.0002491680473945715, "2": 0}, "score": 4.992906546348578}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9958771688006194, "4": 0.003919414494435664, "3": 0.00014507960009472302, "1": 5.539603705903918e-05, "2": 0}, "score": 4.995568829124765}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9956969049590799, "4": 0.004088525039531701, "3": 0.00011263241570340864, "1": 9.980452849249485e-05, "2": 0}, "score": 4.9952869819619545}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9863905415859551, "4": 0.012245439463523498, "3": 0.0011292193790280014, "1": 0.0002297393850435925, "2": 0}, "score": 4.984577086195427}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9513914440830075, "4": 0.04211147542584451, "3": 0.006167615392295469, "1": 0.00030859803053195163, "2": 1.593430859686348e-05}, "score": 4.94427082384301}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986712387859852, "4": 0.0012814300475925227, "3": 3.687565429015029e-05, "1": 1.011409057437533e-05, "2": 0}, "score": 4.998604361805029}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9555396400281124, "4": 0.042710563524957015, "3": 0.0016076919499372544, "1": 7.717901224547426e-05, "2": 0}, "score": 4.953762334523342}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997727675712, "4": 0.0002095307607552065, "1": 1.3333458567500759e-05, "3": 3.2936539051149376e-06, "2": 0}, "score": 4.999730547807622}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9593017240154441, "4": 0.03622483665370682, "3": 0.0037067244126382233, "1": 0.0007543512874337917, "2": 1.0612415167482318e-05}, "score": 4.953312390365708}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9651215326529443, "4": 0.03101301263975225, "3": 0.003451375264425293, "1": 0.00038714277706075536, "2": 1.5100586104939766e-05}, "score": 4.960489896320103}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9491279664461704, "4": 0.046708799777126164, "3": 0.003583490333630368, "1": 0.000523038334114172, "2": 0}, "score": 4.944028892371399}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9785377631435427, "4": 0.01864494155456758, "3": 0.002630342008479858, "1": 0.0001699741825159996, "2": 0}, "score": 4.975414060251012}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9894615378331891, "4": 0.010017026338258721, "3": 0.00037986410029941444, "1": 0.00013994612931682147, "2": 9.648125530688877e-07}, "score": 4.988660559013268}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.985548181670993, "4": 0.013114830367271223, "3": 0.0009565246484463966, "1": 0.00037624478592645084, "2": 3.165346593971232e-06}, "score": 4.98345762773024}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.997700377791823, "4": 0.001295996217048983, "1": 0.0009067534273412723, "3": 9.60198132279809e-05, "2": 5.569290410599397e-07}, "score": 4.994883278146371}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986107308291419, "4": 0.000978898106512516, "1": 0.00034256813011505715, "3": 6.732533119043925e-05, "2": 2.7362836043754845e-07}, "score": 4.99751535731876}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9914224300795934, "4": 0.007932725559933, "3": 0.00047412507489052026, "1": 0.00016575529229938182, "2": 0}, "score": 4.990455955744517}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974996484991352, "4": 0.0019399456922195386, "1": 0.0004485943189109184, "3": 0.00011018067936312742, "2": 0}, "score": 4.996045309224059}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994590266788609, "4": 0.0004591358601905893, "1": 6.585916233304454e-05, "3": 1.551835563772402e-05, "2": 0}, "score": 4.999246390432584}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8804899632780981, "4": 0.10942958455546051, "3": 0.009956639140725367, "1": 0.00011187593766961487, "2": 8.67233919688479e-06}, "score": 4.8701831925755465}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9388641457062991, "4": 0.06023528914455512, "3": 0.0008168438560790971, "1": 7.924664345372895e-05, "2": 0}, "score": 4.93781375830783}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.896837188577699, "4": 0.09598474561346122, "3": 0.006795386859732634, "1": 0.00034400364662258936, "2": 2.4715820828570535e-05}, "score": 4.888972768735499}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8908609181928009, "4": 0.10572472465266203, "3": 0.002701481372357658, "1": 0.000700746543853026, "2": 7.826790733406668e-06}, "score": 4.886045355771126}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9636803890249027, "4": 0.035239572820284094, "3": 0.0009544213665643012, "1": 0.00012302450435938337, "2": 1.6433577511109003e-06}, "score": 4.9623545206331166}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9665851285588789, "4": 0.03063226848474903, "3": 0.0021555809702422713, "1": 0.000605276971839888, "2": 0}, "score": 4.9626346491773194}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9834040850563114, "4": 0.014935678472346012, "3": 0.0010641192683828525, "1": 0.000587130761848221, "2": 5.684672728301166e-06}, "score": 4.980570441773409}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9900846989679493, "4": 0.009025669452065729, "3": 0.0005697661753400808, "1": 0.0003145646306735655, "2": 0}, "score": 4.988576479121057}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9961941227789877, "4": 0.0034909024309130936, "3": 0.00015989439370437024, "1": 0.00015172801727012227, "2": 0}, "score": 4.995582381903066}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9905007714448183, "4": 0.008498491515500146, "3": 0.0006270265335281687, "1": 0.0003673079356531523, "2": 3.5361181510097585e-06}, "score": 4.98876758312319}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8467564414924448, "4": 0.13142533280487687, "3": 0.019819033800142723, "1": 0.00189965117836257, "2": 9.312051905057097e-05}, "score": 4.821057484476581}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9838568944261148, "4": 0.01507339966821101, "3": 0.0009291698545166106, "1": 0.00013238529309156252, "2": 0}, "score": 4.982538577126556}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9732653672439926, "4": 0.02454222930747586, "3": 0.001814097826740337, "1": 0.0003665068670420011, "2": 7.804321025730091e-06}, "score": 4.970340016132958}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952385531996552, "4": 0.004475077092631593, "3": 0.0002368446777074105, "1": 4.63732395009929e-05, "2": 0}, "score": 4.994865724411789}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9733889058173038, "4": 0.02462055046567362, "3": 0.0018829893221155858, "1": 0.00010118591405282082, "2": 5.405670839276141e-06}, "score": 4.971192482485199}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9893182336130016, "4": 0.010204022231505266, "3": 0.0003847091360433395, "1": 8.886288448298114e-05, "2": 0}, "score": 4.988671060692612}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9943292402038884, "4": 0.005571499785370033, "3": 8.591956414644903e-05, "1": 1.1174993490169259e-05, "2": 0}, "score": 4.994211948578623}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9743636292758348, "4": 0.022742151093337708, "3": 0.00274848342841875, "1": 0.00013794782831176412, "2": 3.4505807767562774e-06}, "score": 4.971198614059788}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972688775194498, "4": 0.0022535022891821146, "1": 0.00028922923025005075, "3": 0.0001871582579165127, "2": 7.594996315746781e-07}, "score": 4.99621298398306}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992805592616812, "4": 0.0006839388807245785, "1": 2.15524512668855e-05, "3": 1.3392991636868165e-05, "2": 0}, "score": 4.999203064887508}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9723925937826647, "4": 0.022970603252518915, "1": 0.00278865187179811, "3": 0.0018250425082995687, "2": 1.85918917445796e-05}, "score": 4.96216875769635}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.974217877327994, "4": 0.023909677157689213, "3": 0.0013614554059557251, "1": 0.0004990957484291239, "2": 5.848367473647303e-06}, "score": 4.971353310736594}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9681972904733803, "4": 0.02824921244023675, "3": 0.0026964359405146528, "1": 0.0008411998436509899, "2": 1.0048521989457862e-05}, "score": 4.9629627554488005}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9819789438161212, "4": 0.01712225841850618, "3": 0.0006805358877076852, "1": 0.0002087074598813113, "2": 4.634088658323351e-06}, "score": 4.98066784258}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9675682315490116, "4": 0.026605146618797867, "3": 0.004237643256514193, "1": 0.001560036594473488, "2": 2.3962151338397145e-05}, "score": 4.9586073279078}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9759997487474198, "4": 0.02164063893051562, "3": 0.0021494304046757373, "1": 0.00020029145043555725, "2": 5.680041607465687e-06}, "score": 4.973242181671771}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9887776081643298, "4": 0.010456160005839472, "3": 0.0006307055781213146, "1": 0.00013063988363927354, "2": 0}, "score": 4.987759809493285}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8967009568010524, "4": 0.08366772325938299, "3": 0.018383585590258406, "1": 0.0011343263823091038, "2": 7.724827287820826e-05}, "score": 4.874791527712169}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9704233688256441, "4": 0.026824645656574046, "3": 0.0022695257273515896, "1": 0.00046574233776878755, "2": 7.956638072698995e-06}, "score": 4.9667491723190915}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9938471776146416, "4": 0.005626799899171872, "3": 0.0003375967236897566, "1": 0.00018227044724144784, "2": 0}, "score": 4.992968881585733}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"5": 0.973317194031383, "4": 0.024339671203450673, "3": 0.0017684645407256823, "1": 0.0005698302776404935, "2": 3.4587891043133968e-06}, "score": 4.9698336605727516}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9307167972301685, "4": 0.060968636668878015, "3": 0.007273766744143727, "1": 0.0010128760707951872, "2": 2.3440951525220666e-05}, "score": 4.9203616457393355}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9756691818979495, "4": 0.02209860488116837, "3": 0.0014039676709956543, "1": 0.0008235496654210128, "2": 2.4812849672890844e-06}, "score": 4.9717917547902895}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9925606781643911, "4": 0.006977869765341433, "3": 0.0003123744279822843, "1": 0.00014783067899232943, "2": 8.634429585212002e-07}, "score": 4.991803465190311}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9499941075364473, "4": 0.04850972430511376, "3": 0.0012082196095588229, "1": 0.0002801663567419083, "2": 0}, "score": 4.947952766007225}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9893273304359823, "4": 0.010489803383303183, "3": 0.00016551818334967604, "1": 1.600543829560312e-05, "2": 0}, "score": 4.989115123883226}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995168933536139, "4": 0.0004641517554735438, "3": 1.0568993340866935e-05, "1": 7.908400571347794e-06, "2": 0}, "score": 4.99948307640873}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983736332700721, "4": 0.0015618436946770297, "3": 3.945810822916109e-05, "1": 2.4398619625276136e-05, "2": 0}, "score": 4.998261644452085}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991391707262892, "4": 0.0008134126602556266, "1": 3.261174690458576e-05, "3": 1.4133834855006588e-05, "2": 0}, "score": 4.999027872030088}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9929321724100177, "4": 0.006899274623045628, "3": 0.0001465976204831302, "1": 2.0098788868764782e-05, "2": 0}, "score": 4.992727121477996}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9888606086514217, "4": 0.009885635846973589, "3": 0.0011190748072613704, "1": 0.00012825873077655864, "2": 3.6652152247422616e-06}, "score": 4.987352149102782}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9962341003531724, "4": 0.003574552090700761, "3": 0.0001700437161753126, "1": 2.0191415886306466e-05, "2": 0}, "score": 4.9960045903688135}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.981706352879726, "4": 0.01709900507354218, "3": 0.001067878829932537, "1": 0.00011913645989848718, "2": 0}, "score": 4.980288541092495}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960236795814315, "4": 0.0037570056820546752, "3": 0.0002017028466130156, "1": 1.6507726730050425e-05, "2": 0}, "score": 4.995773553051111}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.992941346450619, "4": 0.006881162316184317, "3": 0.00015775600353388689, "1": 1.7592005360491036e-05, "2": 0}, "score": 4.992732942080371}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9815726437638663, "4": 0.01689027950077602, "3": 0.0008188167071106885, "1": 0.0007141832327833882, "2": 2.9145634769297653e-06}, "score": 4.978606585599328}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.986180767504595, "4": 0.012651405035201724, "3": 0.000766695834836453, "1": 0.0003964125880834156, "2": 3.4828940020125198e-06}, "score": 4.984219084753314}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9712914667530668, "4": 0.025938747130691168, "3": 0.002418808295446571, "1": 0.0003414644445136654, "2": 5.900986604091627e-06}, "score": 4.967839959365951}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9949669332403913, "4": 0.004544090869836162, "1": 0.0003777052985056269, "3": 0.00010983080639283453, "2": 7.993475536214538e-07}, "score": 4.993723024260685}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973032647410078, "4": 0.002607346086658183, "3": 4.7449479614354165e-05, "1": 4.106271605992312e-05, "2": 0}, "score": 4.997133501576021}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9675222499289994, "4": 0.030413806879738468, "3": 0.0018462107198219829, "1": 0.00020085968063266919, "2": 1.0818153016445869e-05}, "score": 4.965057666935868}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9261162798752467, "4": 0.06288443513695653, "3": 0.010304758501442073, "1": 0.000628068701617153, "2": 3.2633310395238196e-05}, "score": 4.91389296059716}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918640236758729, "4": 0.00775146826509729, "3": 0.00035614272305368273, "1": 2.5596882275719334e-05, "2": 0}, "score": 4.99143383504466}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.990139154133784, "4": 0.009496984042406802, "3": 0.0002452780728035554, "1": 0.00011564805354440158, "2": 0}, "score": 4.989549836919291}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9769327240831549, "4": 0.02205533844595033, "3": 0.0008971360815484599, "1": 0.00010618146431816996, "2": 0}, "score": 4.975725454288916}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9652185853281443, "4": 0.03357592455316241, "3": 0.000921786152527468, "1": 0.0002793016995493417, "2": 0}, "score": 4.963463135498567}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9758589543479043, "4": 0.023411802580387008, "3": 0.0006656405818422561, "1": 5.991851512621681e-05, "2": 0}, "score": 4.975017150159236}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9888630511401415, "4": 0.010673321166612043, "3": 0.0004193572818804947, "1": 4.0113163928673384e-05, "2": 0}, "score": 4.9883274630882894}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.993561255127621, "4": 0.006138157274666726, "3": 0.0002221109558110971, "1": 7.674065023193801e-05, "2": 0}, "score": 4.993110646252922}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9831089311199298, "4": 0.016421776328883395, "3": 0.00029813832538869313, "1": 0.00016546373682429873, "2": 0}, "score": 4.982319991465149}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9238842590080892, "4": 0.07041068864492922, "3": 0.004490075779393076, "1": 0.0011910230920571484, "2": 2.03162398323091e-05}, "score": 4.915783812394434}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9953418833342617, "4": 0.0044765648555096784, "3": 0.00010621820946136728, "1": 7.306434987327394e-05, "2": 0}, "score": 4.995018730022323}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9970345483637145, "4": 0.0028313631637365997, "1": 7.462373035981946e-05, "3": 5.8242513347607345e-05, "2": 0}, "score": 4.99675365292035}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9802024823662008, "4": 0.018979441726701365, "3": 0.0005869828235372449, "1": 0.00022513800235011145, "2": 0}, "score": 4.9789459152380395}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9968242514909984, "4": 0.003049238474591427, "1": 7.232555741830563e-05, "3": 5.318125889980547e-05, "2": 0}, "score": 4.996555093321943}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9917236600526373, "4": 0.006982073104012371, "3": 0.0012171651154766414, "1": 7.03628593544573e-05, "2": 4.032750131421336e-06}, "score": 4.9902900207008685}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9674007493418043, "4": 0.02768319855987067, "3": 0.0036353786703901656, "1": 0.001228771118096908, "2": 3.631219219302932e-05}, "score": 4.9600213997793015}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9302849555032012, "4": 0.06002336355321852, "3": 0.009388722913157822, "1": 0.00028709051748397667, "2": 1.3468485619925083e-05}, "score": 4.920010231196031}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9958031684156443, "4": 0.004104535488382621, "3": 8.34439424054886e-05, "1": 7.477649898774821e-06, "2": 0}, "score": 4.995698660115005}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9880123631528094, "4": 0.011469572725693135, "3": 0.00044678873665766195, "1": 6.53914527459507e-05, "2": 0}, "score": 4.987375209706599}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9754434030528519, "4": 0.023325719173288427, "3": 0.0009791979889271882, "1": 0.00023940904107350842, "2": 0}, "score": 4.973757926674803}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9920429066115714, "4": 0.007567768780188235, "3": 0.00025816038987883593, "1": 0.0001271949002800418, "2": 0}, "score": 4.991407096730968}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9953757790848246, "4": 0.004444355121806132, "3": 0.00014755242818766906, "1": 2.9878272917180934e-05, "2": 0}, "score": 4.995141015098073}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943708553443417, "4": 0.005471535439599028, "3": 9.193084025218605e-05, "1": 6.106235516976951e-05, "2": 0}, "score": 4.994100326226202}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9831303690270184, "4": 0.0159551758131332, "3": 0.000826254269078189, "1": 8.268411948072236e-05, "2": 0}, "score": 4.982061480208077}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7701600335115307, "4": 0.21015244143832373, "3": 0.017246018047120712, "1": 0.0023567104721852147, "2": 8.055422482468257e-05}, "score": 4.74568593902615}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.959548514059178, "4": 0.03849139381304872, "3": 0.0015850432261592566, "1": 0.00035953860547144676, "2": 8.421841905590917e-06}, "score": 4.956874794095981}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9545887905897252, "4": 0.04242492651410251, "3": 0.002349775940123394, "1": 0.0006154305215668286, "2": 9.5749619193199e-06}, "score": 4.9503845039823595}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9851764133488133, "4": 0.014067483212655118, "3": 0.000558591958705436, "1": 0.0001923657596437095, "2": 0}, "score": 4.984045787735447}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9806681803159141, "4": 0.018483996043946002, "3": 0.0004320291911053171, "1": 0.0004060245224757429, "2": 0}, "score": 4.979027642585548}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9885450295447871, "4": 0.011034528145470878, "3": 0.0003750493277417157, "1": 4.0101572899282404e-05, "2": 0}, "score": 4.988054903701058}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945559373132103, "4": 0.005286647378000062, "3": 0.00010600132117656744, "1": 4.972767195636103e-05, "2": 0}, "score": 4.994302429683919}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9958342598675347, "4": 0.003947304650300385, "3": 0.00014242970189685427, "1": 7.311960740649381e-05, "2": 0}, "score": 4.9954753444573425}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9953591295734164, "4": 0.004461327105163432, "3": 0.00011821258341344626, "1": 6.0135151732925296e-05, "2": 0}, "score": 4.995061701216915}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9790975254474363, "4": 0.01953690964886416, "3": 0.0011348619107363206, "1": 0.00022264232453996673, "2": 4.660051772080103e-06}, "score": 4.977288739843898}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8358213708169373, "4": 0.14308029540203102, "3": 0.019079792276445646, "1": 0.0018391256693426085, "2": 0.00017322781154266122}, "score": 4.810882763671139}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9853887644073941, "4": 0.014416037166170398, "3": 0.0001721443825237971, "1": 2.1799991022091077e-05, "2": 0}, "score": 4.985152455485087}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.998323492910694, "4": 0.0016322704814342446, "3": 2.5597650193706332e-05, "1": 1.8287185304422465e-05, "2": 0}, "score": 4.998243384859031}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9823301259343331, "4": 0.01709056025107874, "3": 0.0003068547651502845, "1": 0.00027072256685641455, "2": 9.948140516663121e-07}, "score": 4.981209841572972}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99054451292469, "4": 0.009278781914617234, "3": 0.00014192369556018943, "1": 3.2080586266265e-05, "2": 0}, "score": 4.99030902217504}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9250014351105967, "4": 0.07310579795367142, "3": 0.0016631574582506082, "1": 0.0002214217066085234, "2": 0}, "score": 4.922681567237782}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9498481379074115, "4": 0.04868217657345951, "3": 0.0010124690776930768, "1": 0.0004507782610542086, "2": 3.502922282424614e-06}, "score": 4.9474791092977215}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8746712478207854, "4": 0.118305738635323, "3": 0.006770759582841126, "1": 0.00023580178497998087, "2": 1.2249370623094364e-05}, "score": 4.867172228697925}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9386556189744922, "4": 0.05714576469850998, "3": 0.0033393136069972914, "1": 0.0008418567406024687, "2": 1.4482551180892519e-05}, "score": 4.9327645342240665}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9216489779275407, "4": 0.07411899772389278, "3": 0.0038500339982775237, "1": 0.00036735477040059967, "2": 1.079265227803411e-05}, "score": 4.916678817043842}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9889333459796583, "4": 0.01024376552412944, "3": 0.0006473072448893557, "1": 0.00017064980931776877, "2": 0}, "score": 4.9877789604814735}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9951606246930023, "4": 0.0046045791649412665, "1": 0.00013208168513393487, "3": 0.00010025561333285271, "2": 0}, "score": 4.994666569753786}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9743946447381422, "4": 0.022603231414104568, "3": 0.0025453431628868423, "1": 0.00044849420383219604, "2": 5.329724551579836e-06}, "score": 4.970496029035081}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9902579096337689, "4": 0.009327422142460183, "3": 0.0002656884968202589, "1": 0.00014681709464911685, "2": 1.1763395701977392e-06}, "score": 4.989550393160221}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9855016304020651, "4": 0.01345440119590301, "3": 0.000563250156950716, "1": 0.00047634903768417337, "2": 2.155357402784474e-06}, "score": 4.983507199754666}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8012567551647154, "4": 0.18122698003805104, "3": 0.015525777063745595, "1": 0.001939316863764722, "2": 4.8885144553483255e-05}, "score": 4.779817039668005}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9863177022931453, "4": 0.013205577509970408, "3": 0.00024213527509192768, "1": 0.0002329140631767002, "2": 0}, "score": 4.985378471256631}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9931197947387961, "4": 0.006746952213440947, "3": 0.00010395275925010339, "1": 2.7147950566869774e-05, "2": 0}, "score": 4.992936535262827}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912414307135805, "4": 0.008579582725984884, "3": 0.00010714055364860838, "1": 7.008449306646328e-05, "2": 0}, "score": 4.990925782210093}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9889305463133188, "4": 0.010909495742040098, "3": 0.00011207222818672095, "1": 4.6060076624177844e-05, "2": 0}, "score": 4.988682098832677}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9912262004060047, "4": 0.006961395652177922, "3": 0.0012425432397442787, "1": 0.0005582301083683656, "2": 0}, "score": 4.988320461594894}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9869849765418627, "4": 0.012286879417161882, "3": 0.00040532149133073016, "1": 0.0003058951994900562, "2": 0}, "score": 4.985678654379783}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9932480853013341, "4": 0.005843443590577146, "3": 0.0005935595571013326, "1": 0.00030637430027583793, "2": 0}, "score": 4.991743869609462}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991659433187988, "4": 0.0007627936567631284, "1": 4.1806614053741746e-05, "3": 2.8523050731320354e-05, "2": 0}, "score": 4.999012932864271}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998504627018165, "4": 0.00010299099507632497, "1": 4.278290688442405e-06, "3": 7.064531145574194e-07, "2": 0}, "score": 4.999878477885291}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8743410343058434, "4": 0.10888539194067137, "3": 0.014276292280596861, "1": 0.002343397920772917, "2": 0.00011415687032317684}, "score": 4.852840115030151}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9755135097140036, "4": 0.023543518955106285, "3": 0.000780938934532746, "1": 0.00015902629373715297, "2": 1.5250673270411355e-06}, "score": 4.974253884667993}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9497979074666915, "4": 0.04671810976863157, "3": 0.0029676570783253955, "1": 0.0005019707534648028, "2": 1.1537591817351418e-05}, "score": 4.945303926187912}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974694010776531, "4": 0.002503423709989795, "3": 1.3596624426007611e-05, "1": 1.2500898953023351e-05, "2": 0}, "score": 4.997419376664237}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9917411323939935, "4": 0.0078237758162689, "3": 0.00026580755193318856, "1": 0.00016654750065696325, "2": 1.2265294035409574e-06}, "score": 4.990974725858988}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9581863596727195, "4": 0.037685770352837065, "3": 0.003165287785599704, "1": 0.00093736669709028, "2": 1.620968751014461e-05}, "score": 4.952185127613691}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9784049063059179, "4": 0.01911468291983224, "1": 0.001449961028220732, "3": 0.0010238044882884207, "2": 5.219953834888116e-06}, "score": 4.973022165677591}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9963998940768185, "4": 0.002772139151390726, "1": 0.0005728101056088008, "3": 0.0002534872581257631, "2": 0}, "score": 4.994429636610713}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989527327674991, "4": 0.0009013508279049817, "1": 0.0001000393449357085, "3": 4.53558224703723e-05, "2": 0}, "score": 4.998607779421734}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975198115623115, "4": 0.0022723803149232937, "3": 0.00012182316889077932, "1": 8.495991508002845e-05, "2": 5.967485509301278e-07}, "score": 4.9971423422174155}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9563564230074078, "4": 0.040539016428760566, "3": 0.0027148597076185805, "1": 0.0003796212169032529, "2": 7.857115528374866e-06}, "score": 4.9524891023477045}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9524070186133059, "4": 0.043322324477075215, "3": 0.0039005293667250507, "1": 0.0003536329666748695, "2": 1.225918629961711e-05}, "score": 4.947425084688611}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9794762783620432, "4": 0.019360886652811476, "3": 0.0009298632738413301, "1": 0.00022863333381966124, "2": 3.3523498844138927e-06}, "score": 4.97785477457877}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9902022715756827, "4": 0.009128079107446117, "3": 0.00048260309095351367, "1": 0.00018388794140186782, "2": 2.037098635393814e-06}, "score": 4.989165039501128}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9582433811232104, "4": 0.03960479825525357, "3": 0.0020582030143642986, "1": 8.93876525479223e-05, "2": 3.204427854705969e-06}, "score": 4.955911586608414}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.992271256027536, "4": 0.006988369582104669, "1": 0.00045679840103034436, "3": 0.0002798952869275393, "2": 0}, "score": 4.990624611731905}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9893146146935221, "4": 0.01044987460672259, "3": 0.00011463653499466733, "1": 0.00010706129896675731, "2": 0}, "score": 4.988892453700374}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9950617018864745, "4": 0.004601814024829865, "1": 0.00020771948879924883, "3": 0.00011898632350344669, "2": 0}, "score": 4.9943292799230985}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9830999494777632, "4": 0.015789842901564828, "1": 0.0007845219551604009, "3": 0.0003191999018104629, "2": 0}, "score": 4.980433542570752}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9780174124154831, "4": 0.020546698661926637, "1": 0.0007309920308382354, "3": 0.0006957410649285431, "2": 0}, "score": 4.975137623449249}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7963778657968168, "4": 0.14457574816857627, "3": 0.05413324888121304, "1": 0.004251898882274726, "2": 0.0006559804311691214}, "score": 4.7281807880644795}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9318639046620119, "4": 0.06439740124658137, "3": 0.0035803310885879746, "1": 0.00014618713652275766, "2": 1.1000289140624983e-05}, "score": 4.927824102314394}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8601119274546886, "4": 0.1289696208037163, "3": 0.010532782950050768, "1": 0.00035258529265571643, "2": 2.7952497677843028e-05}, "score": 4.848469837131076}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8806306503980225, "4": 0.10418334492606617, "3": 0.011456248240048152, "1": 0.0036589659456444748, "2": 6.478969467800047e-05}, "score": 4.8580730740527605}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9479028366169298, "4": 0.03760906376711404, "3": 0.008988637493442314, "1": 0.005452434896930659, "2": 4.382741601424783e-05}, "score": 4.922472191336011}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9198653668760175, "4": 0.07559172949464901, "3": 0.004149364869275339, "1": 0.00037303425726657193, "2": 1.5602537448201402e-05}, "score": 4.914570177351359}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9027760472631473, "4": 0.09124368448846946, "3": 0.005501057128670219, "1": 0.00045581387528858516, "2": 1.4418405612620167e-05}, "score": 4.89588675572016}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9847462019556965, "4": 0.014423319103473733, "3": 0.0006426514815722446, "1": 0.00018301837505994178, "2": 0}, "score": 4.983559225368072}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9818696428773687, "4": 0.017666506856456356, "3": 0.0003752629041127448, "1": 8.622537931679887e-05, "2": 0}, "score": 4.981238021502582}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.950337542119595, "4": 0.04722570675549178, "3": 0.001599761057421755, "1": 0.0008210186767406587, "2": 8.268619429887179e-06}, "score": 4.946265476659667}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9883822078409569, "4": 0.010783037299347894, "3": 0.0007181096390118417, "1": 0.0001127310121968244, "2": 1.7794539684825462e-06}, "score": 4.9873244539527555}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9933958223732525, "4": 0.006327133430354563, "3": 0.00017785427904596645, "1": 9.633652765704797e-05, "2": 0}, "score": 4.992931791732573}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9865745225506176, "4": 0.01267923960285911, "3": 0.0004595508309407509, "1": 0.0002794956022052678, "2": 0}, "score": 4.98528357049451}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9872246031381531, "4": 0.01233609205356357, "3": 0.00027173125858222, "1": 0.00016047040899891602, "2": 0}, "score": 4.986478467747931}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997917102148635, "4": 0.0019717220125603447, "3": 5.775139806139937e-05, "1": 5.229655808778737e-05, "2": 0}, "score": 4.99770358636888}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9752074191694832, "4": 0.021551468950480844, "3": 0.002951592570182984, "1": 0.00027509804405523677, "2": 9.018369546863404e-06}, "score": 4.971417744197329}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.991820279469627, "4": 0.007553526036812041, "3": 0.00040243442243773927, "1": 0.00022160345767197284, "2": 0}, "score": 4.990755171350102}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9455332234526648, "4": 0.04817018585659673, "3": 0.005925526708278303, "1": 0.000346180341668066, "2": 1.822023077839497e-05}, "score": 4.938538969127791}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979704048193554, "4": 0.0018935517133697208, "1": 7.872569207272094e-05, "3": 5.5505802118522995e-05, "2": 0}, "score": 4.997680529711285}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9682482480377145, "4": 0.030122878888213567, "3": 0.0014512529387148165, "1": 0.00016452451031215336, "2": 0}, "score": 4.966316076081071}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9945261110278977, "4": 0.005282345798014941, "3": 0.00016639867372692587, "1": 2.4199235892263002e-05, "2": 0}, "score": 4.994288054511663}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9829371832299554, "4": 0.01647452550366211, "3": 0.00048076787149007694, "1": 0.00010094386375959099, "2": 0}, "score": 4.982160045919787}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.998721414887349, "4": 0.0012177431626910192, "3": 3.0053603120338192e-05, "1": 2.989829806771175e-05, "2": 0}, "score": 4.998602555195003}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975513646104956, "4": 0.0023580247045816996, "1": 5.903695229642372e-05, "3": 2.9726549170258767e-05, "2": 0}, "score": 4.99734636948615}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99863724000187, "4": 0.0013089414786073713, "1": 2.8982278528227942e-05, "3": 2.3614656513259478e-05, "2": 0}, "score": 4.998527898295957}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9687429168306446, "4": 0.028429555168345753, "3": 0.0024311278342096193, "1": 0.00037639704536684455, "2": 1.1565829960557854e-05}, "score": 4.965167609600855}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9814607822672384, "4": 0.016670504812241346, "3": 0.0013571513113969141, "1": 0.0005072048969591258, "2": 3.5237704184922707e-06}, "score": 4.978575783820749}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.98364024347965, "4": 0.015142398834948577, "3": 0.0010281913408886011, "1": 0.00018573065967048937, "2": 1.9322527649733377e-06}, "score": 4.982052472103407}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9898969333503561, "4": 0.009104367823579946, "3": 0.0007692445720081639, "1": 0.0002240998156010477, "2": 3.076293791472266e-06}, "score": 4.988451488579446}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9857283642318929, "4": 0.01359568657704051, "3": 0.0005526427980266972, "1": 0.00011835700913175203, "2": 2.332065971991248e-06}, "score": 4.984818563857819}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9448591842191538, "4": 0.03422005853397909, "1": 0.014460145500888985, "3": 0.006348404864976762, "2": 0.00010544521806054315}, "score": 4.8949255036000014}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.998250071812916, "4": 0.0017038787656927488, "3": 2.450483776770273e-05, "1": 1.5456112527726628e-05, "2": 0}, "score": 4.9981852760597665}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9904324738188818, "4": 0.008827009470882134, "3": 0.0005079515443871003, "1": 0.00022352953611549624, "2": 0}, "score": 4.989262872279171}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991947448920517, "4": 0.0007332878000900391, "1": 3.815895868062877e-05, "3": 3.13825987060904e-05, "2": 0}, "score": 4.999051308866488}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973416774138346, "4": 0.0024390499018367225, "1": 0.00013827708825636895, "3": 7.554432408472005e-05, "2": 0}, "score": 4.996856735962182}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9920673141434507, "4": 0.0072395878572430895, "3": 0.000497545026466847, "1": 0.0001910420494422703, "2": 0}, "score": 4.991001113298765}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.972056014593038, "4": 0.025355216272357217, "3": 0.002507868725214088, "1": 7.369489709794168e-05, "2": 3.6412082302692916e-06}, "score": 4.969323233722808}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9796753183678282, "4": 0.01963397490210567, "3": 0.0005412780800463709, "1": 0.00014381799232851054, "2": 0}, "score": 4.9787080775067984}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.982935681303087, "4": 0.01639647838225008, "3": 0.0004264721466349258, "1": 0.00023752706098283523, "2": 0}, "score": 4.981800399173935}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9895741677236244, "4": 0.010121751064518871, "3": 0.00021927037512828416, "1": 8.259082178628718e-05, "2": 0}, "score": 4.98910932072061}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9596604835907874, "4": 0.034555173516252674, "3": 0.005428040911041817, "1": 0.00033070527073083953, "2": 1.7256597911387155e-05}, "score": 4.953213763582495}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9392294349031213, "4": 0.05558499434681451, "3": 0.0038114846264827597, "1": 0.0013236436555850181, "2": 2.6329962728754337e-05}, "score": 4.93141681817736}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9582742562223453, "4": 0.037020395073505886, "3": 0.00428325304860938, "1": 0.00040168060502606475, "2": 9.827774973861081e-06}, "score": 4.952776393114912}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9723460347951668, "4": 0.026429213728867477, "3": 0.0008762150555098637, "1": 0.000338394020603406, "2": 0}, "score": 4.97046448051665}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9490209127476462, "4": 0.04887514470328338, "3": 0.0019055942057713963, "1": 0.00018278298191921725, "2": 0}, "score": 4.9465817034824076}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7972784329070728, "4": 0.18145367355105482, "3": 0.019824104157459856, "1": 0.001302480702741571, "2": 0.00010431274581709993}, "score": 4.773366872580964}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9345655781157022, "4": 0.06024748200095342, "3": 0.004434739953507554, "1": 0.0007191530915709188, "2": 2.0199776863086157e-05}, "score": 4.927944900698874}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.799251183723844, "4": 0.17788115859662856, "3": 0.021677921039949016, "1": 0.001073367903910874, "2": 9.273116035185779e-05}, "score": 4.774185996531259}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9905545699741843, "4": 0.009042861654225036, "3": 0.00029548455199421053, "1": 9.717005209410699e-05, "2": 0}, "score": 4.989977389671582}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9569911741361261, "4": 0.03997823891618536, "3": 0.0027091923888479465, "1": 0.00031560156821794637, "2": 4.895089491118947e-06}, "score": 4.953326242856353}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9965232339964882, "4": 0.0033286235792589665, "3": 0.00010954315245415828, "1": 3.800947831492812e-05, "2": 0}, "score": 4.996300250020485}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9929427557332722, "4": 0.006947745920477378, "3": 7.972207773911647e-05, "1": 2.6511737460389085e-05, "2": 0}, "score": 4.99278673942629}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9942305982897487, "4": 0.005449447781151622, "3": 0.00019917872912825283, "1": 0.00011834351720176564, "2": 0}, "score": 4.993678805320645}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995279703410699, "4": 0.0004340816100289954, "1": 2.680578059132098e-05, "3": 9.935473731571643e-06, "2": 0}, "score": 4.999438823642916}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9909723313215411, "4": 0.008747529161785571, "3": 0.0001849520418011612, "1": 9.11960475582681e-05, "2": 0}, "score": 4.990517744716646}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9570144139919761, "4": 0.037273897359609565, "3": 0.005185349674194263, "1": 0.000504553337636402, "2": 1.9425886998978493e-05}, "score": 4.950278794950866}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9936869519548732, "4": 0.005789600430817795, "3": 0.00032818601218706614, "1": 0.0001935654228605024, "2": 1.1427624785947966e-06}, "score": 4.992776333568232}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9956836702437774, "4": 0.0038177711318047947, "3": 0.000250266051491942, "1": 0.0002469632544036133, "2": 9.025596994067256e-07}, "score": 4.994691133802892}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9901097018925504, "4": 0.009321366880877105, "3": 0.000419880252682465, "1": 0.00014573509530807683, "2": 1.908215587440883e-06}, "score": 4.989250192453657}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9965203904214971, "4": 0.0031812906492078865, "3": 0.00016645659054232434, "1": 0.00013007946825548065, "2": 9.752490135932937e-07}, "score": 4.9959625492889135}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9792137570968527, "4": 0.018689788010151347, "3": 0.0017812516279693959, "1": 0.0003055204017734278, "2": 0}, "score": 4.976525399825474}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9908010872717533, "4": 0.008612471084805865, "3": 0.00033860307730059375, "1": 0.00024242334515772856, "2": 0}, "score": 4.9897405738229015}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9856257503219378, "4": 0.012180475232681648, "3": 0.001642801931739873, "1": 0.0005472405991801685, "2": 2.358058375014723e-06}, "score": 4.982337860066755}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9938579005878416, "4": 0.005889383239260547, "3": 0.00015089746372285684, "1": 9.948984294152937e-05, "2": 0}, "score": 4.993410847116272}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9856028259192114, "4": 0.01383784152682398, "3": 0.0003585971300615409, "1": 0.00019556025818900919, "2": 0}, "score": 4.984662643806938}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9899937866344645, "4": 0.008877032107243459, "3": 0.0008283205838089903, "1": 0.0002966919983069472, "2": 2.22016508995593e-06}, "score": 4.988272875386208}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9911819272852964, "4": 0.007961976547199278, "3": 0.0005858715443562188, "1": 0.00026386709753594697, "2": 3.1264637013551804e-06}, "score": 4.989801399630531}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9393118934746775, "4": 0.05238935275499181, "3": 0.007754383365169437, "1": 0.0005162220786970494, "2": 2.2446115223923486e-05}, "score": 4.929969254524105}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9880962716895573, "4": 0.010920456560169944, "3": 0.0007005136544102192, "1": 0.0002756602303686016, "2": 0}, "score": 4.986575779926227}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9515361617271504, "4": 0.04333897211194519, "3": 0.003787246655578869, "1": 0.0013097900785387616, "2": 2.041154266941647e-05}, "score": 4.94378572264374}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8639981943957491, "4": 0.13068925145859622, "3": 0.004261706977566392, "1": 0.0010086736792282549, "2": 2.1477278405623694e-05}, "score": 4.856685241961747}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9863673449123478, "4": 0.013075261097689219, "3": 0.00042711054100798426, "1": 0.0001235461237449969, "2": 0}, "score": 4.985576236147727}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9650372570948406, "4": 0.03387598238186883, "3": 0.0006834035661839633, "1": 0.0003832147580318303, "2": 0}, "score": 4.96322361069628}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9945677308274387, "4": 0.005163534259176164, "3": 0.00016212498627249847, "1": 0.00010092246592872423, "2": 0}, "score": 4.994108492396843}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9599575348786844, "4": 0.03804117702544946, "3": 0.0012057698938516828, "1": 0.000781498443333844, "2": 0}, "score": 4.95642067844194}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9951535398711864, "4": 0.004508750116084646, "3": 0.0002509366603201625, "1": 8.592643798653073e-05, "2": 0}, "score": 4.994645666276666}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9985465364028391, "4": 0.0013987196451298485, "1": 3.371711452875262e-05, "3": 2.0595807959267994e-05, "2": 0}, "score": 4.99842521960206}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9846693356673021, "4": 0.014700364346917644, "3": 0.0005069612435485568, "1": 0.00011967545748078564, "2": 0}, "score": 4.983806952016316}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9929530990732423, "4": 0.006872325701348987, "3": 0.0001217578891687822, "1": 5.0134758900782444e-05, "2": 0}, "score": 4.992683599857901}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9988483004156159, "4": 0.0011160486754271698, "1": 2.100561027433343e-05, "3": 1.39090618303615e-05, "2": 0}, "score": 4.998772109855796}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9611608521976025, "4": 0.03191055966456911, "3": 0.006679000021630865, "1": 0.00023674261964641045, "2": 8.311304349350933e-06}, "score": 4.953759326236433}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9976522071869374, "4": 0.0023166101593928776, "3": 2.4356933637394404e-05, "1": 4.040439842546023e-06, "2": 0}, "score": 4.997618507580838}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9924502962697418, "4": 0.007342903076804159, "3": 0.0001589339262958319, "1": 4.432104222033302e-05, "2": 0}, "score": 4.99216191711035}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9858201102400863, "4": 0.013659910183602757, "3": 0.00037805521559865327, "1": 0.00013545866764603885, "2": 0}, "score": 4.985042048001089}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990708641143058, "4": 0.000917703962764998, "3": 7.210069264404766e-06, "1": 1.2744332346833194e-06, "2": 0}, "score": 4.999062775403371}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9938243337034973, "4": 0.005841819339040391, "3": 0.00018671503133973777, "1": 0.00014509410878015488, "2": 0}, "score": 4.993204360314888}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9860648497546969, "4": 0.013078578712251316, "3": 0.00044510929464963635, "1": 0.0004066719569891438, "2": 0}, "score": 4.984404440163373}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9696051909295028, "4": 0.02581132060892852, "1": 0.002474268208536607, "3": 0.0020948138164224345, "2": 1.0452054458259223e-05}, "score": 4.960070464864065}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.983400397297907, "4": 0.01527330111617824, "3": 0.0008426717996730757, "1": 0.0004660302554909413, "2": 0}, "score": 4.981176902984837}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9927416887027793, "4": 0.006399281887436624, "1": 0.0005437014320056874, "3": 0.0003117518622142991, "2": 2.0629408420026676e-06}, "score": 4.990796205910637}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7804382173057219, "4": 0.19405128484175296, "3": 0.020280608414381902, "1": 0.00499139075317241, "2": 0.00016240521803426755}, "score": 4.74491530938422}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9376779460772331, "4": 0.057431519853714356, "3": 0.0036070258877509706, "1": 0.0012258542880996346, "2": 2.383682271563394e-05}, "score": 4.930377146309287}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8823697086481441, "4": 0.10894568758194331, "3": 0.0080480552547377, "1": 0.0006034476289894846, "2": 2.298832683004741e-05}, "score": 4.872474156799475}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9860967292535784, "4": 0.013332436210666586, "3": 0.00043057006272918135, "1": 0.00013267725937502332, "2": 0}, "score": 4.985275602909229}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9737727507632742, "4": 0.024109452390703185, "3": 0.0016205105906222268, "1": 0.0004828632841353007, "2": 7.387471744580857e-06}, "score": 4.970695704705922}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9830860082362304, "4": 0.015527044018845056, "3": 0.0008028842510892119, "1": 0.0005760925114549334, "2": 5.050870264096364e-06}, "score": 4.980547608019199}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9862131177229007, "4": 0.011243966559694927, "3": 0.0014180796241722439, "1": 0.0011144402701273133, "2": 8.357025463357945e-06}, "score": 4.981437004188869}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9840861086184148, "4": 0.01381233839060922, "1": 0.0012543283863012736, "3": 0.0008389809981212225, "2": 4.444318584833472e-06}, "score": 4.979478975146907}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962448779708378, "4": 0.003083865612326879, "1": 0.0005966066735354961, "3": 7.214417576359849e-05, "2": 0}, "score": 4.994385405274258}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9893861387896271, "4": 0.008969772191008403, "1": 0.001325498054479177, "3": 0.00030889751584846364, "2": 0}, "score": 4.985110296226794}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.937086846818356, "4": 0.058596477214483134, "3": 0.004109682105742758, "1": 0.00017896782802161886, "2": 1.73620199314947e-05}, "score": 4.932415480479924}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8749916548362529, "4": 0.12109925262434251, "3": 0.0036442561806902386, "1": 0.00024261408611774528, "2": 1.9030073772910773e-05}, "score": 4.870584275327764}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.942987183159906, "4": 0.0524944305381284, "3": 0.004325601816304593, "1": 0.00017527051106689073, "2": 6.9278017699223045e-06}, "score": 4.938131845432708}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9685717783255491, "4": 0.03027062828908174, "3": 0.0010278086165009534, "1": 0.00012404687991211146, "2": 0}, "score": 4.967177378625711}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9681729309359963, "4": 0.03122383604644823, "3": 0.0004981088153945434, "1": 9.538492603628607e-05, "2": 0}, "score": 4.967398089099604}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9728742496243166, "4": 0.025542291765584244, "3": 0.001412541097205803, "1": 0.00016415474630445385, "2": 4.566287712069807e-06}, "score": 4.970962244410833}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9875361828671442, "4": 0.012038758006845273, "3": 0.0003999749651259808, "1": 2.217289413511821e-05, "2": 0}, "score": 4.987072562851145}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8988805888261511, "4": 0.09267718066333981, "3": 0.008376371110367875, "1": 5.1890024107301834e-05, "2": 1.0936420590709746e-05}, "score": 4.890329375131604}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9322858363071777, "4": 0.060830425242696835, "3": 0.006592227338103791, "1": 0.000275004801623787, "2": 1.3850697023372154e-05}, "score": 4.924843349196523}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9339785002710317, "4": 0.06256167555097013, "3": 0.00332494881160114, "1": 0.00012481561370984555, "2": 6.7075821985459415e-06}, "score": 4.930268807873548}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9915790019233347, "4": 0.008073073614545255, "3": 0.00020154033961776232, "1": 0.0001448989434854455, "2": 0}, "score": 4.990944236482847}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9800761659308367, "4": 0.017619144719072194, "3": 0.0017045014767561152, "1": 0.0005888082376932338, "2": 8.112917609263424e-06}, "score": 4.9765922041571455}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9870756806808769, "4": 0.011948888708900679, "3": 0.0008409078297618187, "1": 0.00013084999070809571, "2": 1.8025558203009321e-06}, "score": 4.985840461519633}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962264179235291, "4": 0.003568421278163745, "3": 0.00010497975877094705, "1": 9.931400098743034e-05, "2": 0}, "score": 4.9958243595799035}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9977826202267016, "4": 0.0020502449605895993, "1": 0.00011472013549735925, "3": 5.219525330837859e-05, "2": 0}, "score": 4.997386483417336}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7665553054839005, "4": 0.15692098195206436, "3": 0.07108742652038808, "1": 0.00524422399217877, "2": 0.00017872808237357727}, "score": 4.679386809744953}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9662077150043025, "4": 0.028911703512784246, "3": 0.0036254074390944333, "1": 0.001229671399706685, "2": 1.527072440664644e-05}, "score": 4.958872563024347}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9835576654294772, "4": 0.015449451158361695, "3": 0.0008507268978428833, "1": 0.0001325771258493577, "2": 0}, "score": 4.9823186171657206}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967402709906868, "4": 0.003095402601640266, "1": 9.589775367189011e-05, "3": 6.566168393078457e-05, "2": 0}, "score": 4.996389673026144}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9643150571469237, "4": 0.032874802372012374, "3": 0.002124312623984339, "1": 0.0006747740256208678, "2": 0}, "score": 4.9601770360812045}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9926905913198171, "4": 0.006810804709109877, "3": 0.0002505996279851542, "1": 0.0002458942481569609, "2": 9.927033090227895e-07}, "score": 4.991701431659615}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9989432174883517, "4": 0.0008585522650334291, "1": 0.00015986369692776381, "3": 3.779956361432303e-05, "2": 0}, "score": 4.998426392927813}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9976940857144612, "4": 0.0021028502344291366, "1": 0.00015651495397390601, "3": 4.52609467476689e-05, "2": 0}, "score": 4.997180564424323}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988014406467061, "4": 0.0011084444975839611, "1": 7.215391588476999e-05, "3": 1.678097086729052e-05, "2": 0}, "score": 4.998569376209051}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9979774089994237, "4": 0.0017436523743460204, "1": 0.0002174379577177505, "3": 6.054098404759981e-05, "2": 0}, "score": 4.997265511202441}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9717552515939379, "4": 0.026070504486408613, "3": 0.001954223209104289, "1": 0.00020056082312284028, "2": 9.488196552681941e-06}, "score": 4.969190033985776}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9850593478507279, "4": 0.013761932679238508, "3": 0.0010834747948195226, "1": 8.975381720215406e-05, "2": 0}, "score": 4.983712013027291}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9860801506416822, "4": 0.011929374202880592, "3": 0.0019146267192948787, "1": 6.590837750688624e-05, "2": 0}, "score": 4.983977579584704}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9869919298755154, "4": 0.012543449523331343, "3": 0.00028099153883256756, "1": 0.0001810714234207159, "2": 0}, "score": 4.986170246333805}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9671203608213212, "4": 0.03139515177685922, "3": 0.0011911361255119378, "1": 0.0002827634148174315, "2": 0}, "score": 4.965091152702807}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"5": 0.977901120345377, "4": 0.021247237331348857, "3": 0.0006350498869699664, "1": 0.00021070616035843076, "2": 0}, "score": 4.97663970074811}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9723488536304076, "4": 0.025473777226120434, "3": 0.0015972577921740969, "1": 0.0005686508116539564, "2": 6.207408871862984e-06}, "score": 4.969038319070541}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9485532375808126, "4": 0.04114888698405282, "3": 0.008191080996683538, "1": 0.0020876471765249654, "2": 1.706872015914687e-05}, "score": 4.9340670191115485}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9958841434507946, "4": 0.003970927040824182, "3": 7.77465796120956e-05, "1": 6.203703577827055e-05, "2": 0}, "score": 4.995625409145663}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9741450212199811, "4": 0.024554805512669985, "3": 0.0011560786207675553, "1": 0.00013945591892617888, "2": 2.3105406804908098e-06}, "score": 4.972568218081732}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5753137700352382, "4": 0.33466347643792776, "3": 0.08522552506927751, "1": 0.0040680618373073974, "2": 0.0007095289207773046}, "score": 4.476474358472743}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8280621309771717, "4": 0.1470446936468158, "3": 0.022204557908137364, "1": 0.0025204175417838652, "2": 0.00013251204645886344}, "score": 4.798059777412041}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8962328612363423, "4": 0.09837556784619843, "3": 0.004714084260996143, "1": 0.000648841884741724, "2": 1.6656500455221024e-05}, "score": 4.889549602482149}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9950541472076998, "4": 0.004814745937122848, "3": 6.656251344965537e-05, "1": 6.317139310676114e-05, "2": 0}, "score": 4.994799436323445}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9112181301893251, "4": 0.08575949244463313, "3": 0.0025795010247828534, "1": 0.00042152751663831697, "2": 1.2608038137350727e-05}, "score": 4.907356761550071}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7797329809678551, "4": 0.19938417254619564, "3": 0.02021399080929596, "1": 0.000647237663100618, "2": 1.973568775402783e-05}, "score": 4.757539231729388}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9223010594839384, "4": 0.07614544633881622, "3": 0.0013195632082304604, "1": 0.00022892846113648098, "2": 0}, "score": 4.920299314696871}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9168618485171565, "4": 0.07950574466463169, "3": 0.0033926464446816474, "1": 0.00022815005717231234, "2": 0}, "score": 4.912795349743738}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9762652050444782, "4": 0.0234320086571111, "3": 0.00021967134828108372, "1": 7.983284872902032e-05, "2": 0}, "score": 4.975809237854876}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9535681433032415, "4": 0.04535421332050278, "3": 0.0007387773263093667, "1": 0.00033246365902734075, "2": 0}, "score": 4.951838069039259}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9956081590637419, "4": 0.003808827042895811, "3": 3.165036110874992e-05, "1": 8.074997487508994e-06, "2": 0}, "score": 4.996093449861035}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9853862092976406, "4": 0.013589800919089554, "3": 0.0007274625775758342, "1": 0.0002852013887631442, "2": 5.0179077199290965e-06}, "score": 4.983799312455081}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9641768440610926, "4": 0.033053474156806574, "3": 0.0019597801115851733, "1": 0.0007848311177117573, "2": 1.6838645262183197e-05}, "score": 4.9598367945935955}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9613423807198248, "4": 0.037072363726005655, "3": 0.0012217585789313866, "1": 0.00034836084656450695, "2": 7.871696132608097e-06}, "score": 4.9590667632847385}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9886826287717625, "4": 0.010988697878272372, "3": 0.00029600624674341744, "1": 2.8592531803199225e-05, "2": 0}, "score": 4.988304871848392}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.969286237475733, "4": 0.030106610903416462, "3": 0.0005427631614160638, "1": 5.9158161342971066e-05, "2": 0}, "score": 4.968571065745684}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9923796039725957, "4": 0.007376588574642258, "3": 0.000154950166374633, "1": 8.624581715348496e-05, "2": 0}, "score": 4.9919685068499975}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9970908321537396, "4": 0.0027742895016717784, "3": 7.274702836234023e-05, "1": 6.033845074413014e-05, "2": 0}, "score": 4.996838856971122}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943866401125828, "4": 0.0053222879621928065, "1": 0.00015467088825909397, "3": 0.00013474667820754802, "2": 0}, "score": 4.9937895248540025}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9939556390935234, "4": 0.005975955366328768, "3": 5.483537736217494e-05, "1": 1.1189217126203472e-05, "2": 0}, "score": 4.993869602414299}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9987448425698418, "4": 0.000964713878069281, "1": 0.00022629434377568613, "3": 6.32836219031164e-05, "2": 0}, "score": 4.998003539774913}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9956921754100141, "4": 0.003748605405632753, "1": 0.00033754440025275575, "3": 0.00021982286390473212, "2": 1.2430692935079552e-06}, "score": 4.994457838683316}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9986337914138436, "4": 0.001197885931019028, "1": 0.00011224719730311945, "3": 5.5180882289737374e-05, "2": 0}, "score": 4.9982427619432075}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999602894867123, "4": 0.0003396311439457801, "1": 4.998642946873283e-05, "3": 4.636619561604516e-06, "2": 0}, "score": 4.9994511483343125}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969038564687323, "4": 0.0029665322527511616, "3": 9.434455485535729e-05, "1": 3.453428359347579e-05, "2": 0}, "score": 4.996706639090975}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9951106987368645, "4": 0.004562379369430208, "3": 0.00021920372706526404, "1": 0.00010616405198587208, "2": 0}, "score": 4.994574548536723}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9980359458834641, "4": 0.001342725198533759, "1": 0.000456471769967614, "3": 0.00016415967102071345, "2": 0}, "score": 4.996503065940523}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962122222963273, "4": 0.0027692022407278965, "1": 0.0005674017223961097, "3": 0.00044943082909434094, "2": 1.2249959746169046e-06}, "score": 4.994058651146458}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988824364398056, "4": 0.0010585579728691283, "1": 3.3079923512802966e-05, "3": 2.4415582559852682e-05, "2": 0}, "score": 4.998760289295896}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9931471890350946, "4": 0.00613212459107351, "1": 0.0004250165706649743, "3": 0.00029313479603880314, "2": 0}, "score": 4.991581518193278}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9351880994913834, "4": 0.058673212625077624, "3": 0.005949799246963145, "1": 0.00018034750228066175, "2": 5.090319292489472e-06}, "score": 4.92869028183735}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9766575784731718, "4": 0.02142662438720121, "3": 0.0014181452827788283, "1": 0.0004895317186665306, "2": 4.888451359670333e-06}, "score": 4.973764208032633}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9785768026863394, "4": 0.019317257724458164, "3": 0.0017545801174591782, "1": 0.00033897608459153517, "2": 7.934057409617227e-06}, "score": 4.975793767828519}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970623984201957, "4": 0.0027620558592391384, "1": 0.00011903059464971271, "3": 5.398577348994386e-05, "2": 0}, "score": 4.996653841751567}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976681064977925, "4": 0.0021962542134283335, "3": 7.731334331478117e-05, "1": 5.770931263421466e-05, "2": 0}, "score": 4.997418280257432}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7999141496581231, "4": 0.16713150856920259, "3": 0.03201536612599756, "1": 0.0008135463962897734, "2": 0.00011846879090106651}, "score": 4.765226533089735}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9597304070009007, "4": 0.039315029625383496, "3": 0.000824024496281269, "1": 0.000122897608560379, "2": 0}, "score": 4.958545014179119}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9639655514697377, "4": 0.03457136986507055, "3": 0.0009634089247555775, "1": 0.0004909783130923061, "2": 4.920231380544055e-06}, "score": 4.961522993234576}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.990397972704583, "4": 0.009050907047948227, "3": 0.0004437369171891105, "1": 0.00010550755460305084, "2": 1.0143525812187895e-06}, "score": 4.989636536914191}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9168457155580081, "4": 0.07608094041129185, "3": 0.005422716987106312, "1": 0.0016320316977302648, "2": 1.5276635320679902e-05}, "score": 4.906499358616048}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9418061275333661, "4": 0.05447499989930043, "3": 0.003558798112390423, "1": 0.0001442440357574013, "2": 1.1742967584448292e-05}, "score": 4.937794944569982}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.960766415070079, "4": 0.03517935057168081, "3": 0.0031546680577934595, "1": 0.0008685659844343473, "2": 1.9138357321416347e-05}, "score": 4.954979100266978}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8861264840895562, "4": 0.10215173224563279, "3": 0.010801941418875995, "1": 0.0008529539481762932, "2": 5.665348807565336e-05}, "score": 4.872661305372378}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9961799241253426, "4": 0.0035426274841138454, "3": 0.0001597841046268216, "1": 0.00011642351781391727, "2": 0}, "score": 4.995672104865464}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9880625159332298, "4": 0.011310565388071394, "1": 0.00035298676311212125, "3": 0.00026986573511530705, "2": 0}, "score": 4.986737702162352}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9565917577173096, "4": 0.04230800361802507, "3": 0.0009755355067987137, "1": 0.00011308610932773226, "2": 0}, "score": 4.955288061510306}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9969968645598681, "4": 0.002877092624816406, "1": 7.060327686667926e-05, "3": 5.447863235794857e-05, "2": 0}, "score": 4.996731533862311}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9426667455054497, "4": 0.05279423393551852, "3": 0.004346175569551001, "1": 0.00017541516890167279, "2": 6.9267488240791884e-06}, "score": 4.937790320610574}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.968481317946019, "4": 0.030355850874709225, "3": 0.001035305941802742, "1": 0.0001217302532647348, "2": 0}, "score": 4.967086425494981}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9771240125586639, "4": 0.021492167769690474, "3": 0.0010620166269746153, "1": 0.0003174437248208367, "2": 3.5822050908659665e-06}, "score": 4.97510325811418}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9348438584023667, "4": 0.06120700103560275, "3": 0.003425687833951439, "1": 0.0005015676822737632, "2": 1.8390653212411314e-05}, "score": 4.929879935580729}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9488503358760217, "4": 0.04780644576193178, "3": 0.002922847402492776, "1": 0.0004009178558084401, "2": 1.2823668409720699e-05}, "score": 4.944705350432315}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.828304979239296, "4": 0.16535290019074328, "3": 0.005900131737086444, "1": 0.0004087379157925925, "2": 2.5511429258464566e-05}, "score": 4.821133966052646}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9747318231478952, "4": 0.023732734056013123, "3": 0.0009909405652039369, "1": 0.0005336947562227901, "2": 0}, "score": 4.9721503048038125}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9703648860827825, "4": 0.028214230518627436, "3": 0.0011670719193819152, "1": 0.0002412202841112969, "2": 0}, "score": 4.968486347711619}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9763063369402899, "4": 0.022610632923630546, "3": 0.0007699661539436281, "1": 0.00030761609415538686, "2": 3.228241487825058e-06}, "score": 4.974609229308862}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9329046971775254, "4": 0.058497023873249336, "3": 0.008179785100868883, "1": 0.00038397062718803954, "2": 2.7749881168422735e-05}, "score": 4.923523755773152}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9701171117592705, "4": 0.02579300107550013, "3": 0.004032716744493234, "1": 5.11458092254203e-05, "2": 3.0202075613964505e-06}, "score": 4.965927819209335}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9866002862940952, "4": 0.011893398270378434, "3": 0.0009189765066245895, "1": 0.0005798671107918779, "2": 5.398788399671822e-06}, "score": 4.9839329506005345}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9960316019852862, "4": 0.0038419958300328996, "3": 0.00010202649739849055, "1": 2.3653723820709874e-05, "2": 4.051931378226341e-07}, "score": 4.995858119388449}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9104456391409349, "4": 0.0732349289776005, "3": 0.015536891286006844, "1": 0.000708520687675589, "2": 5.4882995132848115e-05}, "score": 4.892690503141817}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9943977242044804, "4": 0.005327009327837001, "3": 0.00022511639013928872, "1": 4.811165993202312e-05, "2": 0}, "score": 4.994030299083413}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9773074115168823, "4": 0.02162458753223438, "3": 0.000865207063422455, "1": 0.00019715467204520963, "2": 0}, "score": 4.975856243500896}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9900532642777854, "4": 0.009437690303509676, "1": 0.00030274884214424603, "3": 0.0001938817734259696, "2": 0}, "score": 4.988963413764016}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9947433497952842, "4": 0.004964317267518286, "3": 0.00023629347201235685, "1": 5.331136619978501e-05, "2": 0}, "score": 4.994349834909448}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"5": 0.943172515325123, "4": 0.05095665039301081, "3": 0.005748605358154087, "1": 0.00011134356017667867, "2": 7.878074789482788e-06}, "score": 4.937076941197798}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.986658190084124, "4": 0.012958781662501823, "3": 0.0003702278244723696, "1": 1.2046998695063701e-05, "2": 5.138014141185945e-07}, "score": 4.986251029994882}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9684599592945558, "4": 0.028423031334073232, "3": 0.0029830219950810243, "1": 0.00012371017827731464, "2": 5.762881199917163e-06}, "score": 4.96509863776325}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9755035195313054, "4": 0.023527924186564016, "3": 0.0008622404343785902, "1": 9.634433123182868e-05, "2": 0}, "score": 4.974361961969632}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9862638981574248, "4": 0.013263142915827562, "3": 0.0003804807398295665, "1": 8.63846119886089e-05, "2": 0}, "score": 4.98563026959353}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9937826668022893, "4": 0.005542856485519903, "3": 0.0003708237780426371, "1": 0.0002993575139567903, "2": 0}, "score": 4.992518033764378}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9967766307454536, "4": 0.002820966844875422, "1": 0.0002925397509038557, "3": 0.00010632724527007952, "2": 0}, "score": 4.995796204798815}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9730348367442592, "4": 0.0252074977236848, "3": 0.0014203684062455155, "1": 0.0003283872518862028, "2": 0}, "score": 4.970637954844158}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986311762949581, "4": 0.001254070397487271, "1": 7.813331684169542e-05, "3": 3.542407089901232e-05, "2": 0}, "score": 4.998362546235085}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9505502257979526, "4": 0.047024224272360186, "3": 0.001657207536566712, "1": 0.0007558317949443025, "2": 7.242761511862504e-06}, "score": 4.946616023972127}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9103867406759655, "4": 0.08213366482338672, "3": 0.006403810981350034, "1": 0.0009566738779311518, "2": 0}, "score": 4.901220252081839}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9537517991399317, "4": 0.04244173435606808, "3": 0.003277646318490814, "1": 0.0004826706601159782, "2": 2.060802489535139e-05}, "score": 4.949009163909334}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9597799399653931, "4": 0.03858765007301638, "3": 0.0014020967278349796, "1": 0.00021631540651729622, "2": 0}, "score": 4.957742303329306}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9849082956570389, "4": 0.01472495360814314, "3": 0.0003073550389250748, "1": 5.0844479793289235e-05, "2": 0}, "score": 4.984456825481789}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9503023375174284, "4": 0.04390714130653719, "3": 0.0053317130217045115, "1": 0.00043734246369277235, "2": 1.8723933240192278e-05}, "score": 4.943623736425525}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9944494714229976, "4": 0.005343018091463371, "1": 0.00011238725686714505, "3": 9.368794802420151e-05, "2": 0}, "score": 4.9940200484021116}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9976676308097527, "4": 0.0022822175478204075, "1": 3.3874094830238064e-05, "3": 1.2815758646724714e-05, "2": 0}, "score": 4.997556646097189}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991420291676316, "4": 0.0008180014898750863, "1": 2.3788268951501196e-05, "3": 1.4999105379610221e-05, "2": 0}, "score": 4.999056846108781}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978328195339551, "4": 0.0021094051303238793, "1": 3.688085412398492e-05, "3": 1.6625997054793773e-05, "2": 0}, "score": 4.997709809683427}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9920772824859041, "4": 0.007660471833990233, "1": 0.00014025687432046198, "3": 0.00011835819270776117, "2": 0}, "score": 4.991541753574692}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.887239066889782, "4": 0.0903485780778205, "3": 0.021275457513639715, "1": 0.001049237047876232, "2": 8.345166132715582e-05}, "score": 4.862652625650472}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9848079277821022, "4": 0.014138382738278032, "3": 0.0008833659533616559, "1": 0.00016306021633665722, "2": 0}, "score": 4.983442524227574}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8717515547033301, "4": 0.10519858808645599, "3": 0.020675120702498835, "1": 0.002290960768131108, "2": 7.53266174671671e-05}, "score": 4.84406003002777}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9855499142662194, "4": 0.013330255202513845, "3": 0.0009328244792021082, "1": 0.000175552221660721, "2": 0}, "score": 4.984101704856062}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9844472271964193, "4": 0.0144918682096166, "3": 0.000978754219066846, "1": 7.758387102456478e-05, "2": 0}, "score": 4.983240211334513}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5687834256899634, "4": 0.31217092644904926, "3": 0.11420018063716081, "1": 0.0043080479038822206, "2": 0.0005322690305082006}, "score": 4.440596832481352}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9756085810644847, "4": 0.022950682599965685, "3": 0.0008552245430985114, "1": 0.0005811792086789401, "2": 2.7620842505078954e-06}, "score": 4.973005822832027}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9033873667273931, "4": 0.0766589282263112, "3": 0.01365536901847725, "1": 0.006175465590742224, "2": 0.00010996680614823844}, "score": 4.8709969063470115}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9197281010106823, "4": 0.07617686281463364, "3": 0.003602596296438377, "1": 0.00047167045725702824, "2": 1.416911446305951e-05}, "score": 4.9146881923359915}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9791092962286413, "4": 0.01969338276340735, "3": 0.0007444312901688435, "1": 0.00044679235566108565, "2": 3.0504787879781635e-06}, "score": 4.977021363784022}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7721199695958164, "4": 0.1905289361785518, "3": 0.035212596685898524, "1": 0.0019109392573919614, "2": 0.00021897324599868867}, "score": 4.730742882099945}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9277489971412288, "4": 0.0643447006701054, "3": 0.006455709150933254, "1": 0.0013997312850970575, "2": 3.836457692595143e-05}, "score": 4.917028825251512}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9390762459270494, "4": 0.05440450587313823, "3": 0.005935396179935741, "1": 0.0005471341165206666, "2": 3.130661941093563e-05}, "score": 4.93144187445519}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9705342984381227, "4": 0.02797335021698517, "3": 0.0010897735027236186, "1": 0.00038321897341735313, "2": 0}, "score": 4.9683136134713}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9756797386956099, "4": 0.023328971005188593, "3": 0.0005345953780070852, "1": 0.00044427549665206767, "2": 0}, "score": 4.973824411166437}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.937719350161034, "4": 0.0604635847573481, "3": 0.0017294549118085402, "1": 8.12012432462048e-05, "2": 3.5408172354157458e-06}, "score": 4.93574189369507}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9534429670941348, "4": 0.04475211825832466, "3": 0.0017099393105565286, "1": 8.952272986097518e-05, "2": 0}, "score": 4.951469647584173}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9157105845170126, "4": 0.08172675926167566, "3": 0.0019465903020082212, "1": 0.0006043002384548699, "2": 5.770825038832979e-06}, "score": 4.9119450188284555}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9954526745351832, "4": 0.004404200210926757, "1": 7.331385127550489e-05, "3": 6.69028493872116e-05, "2": 0}, "score": 4.995168724633175}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9892345804000751, "4": 0.010518612205542182, "3": 0.0001638537985489974, "1": 7.953113323066441e-05, "2": 0}, "score": 4.988835517454413}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9826916968232163, "4": 0.016391751958879142, "3": 0.0007132832153071289, "1": 0.00019593844581944535, "2": 3.585107852449299e-06}, "score": 4.981387102808628}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9654113220417867, "4": 0.03344468496335526, "3": 0.0009846650749947155, "1": 0.0001510801601630171, "2": 0}, "score": 4.963981367172975}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.936807224347132, "4": 0.055516983279705646, "3": 0.007081968310191853, "1": 0.0005504337247815359, "2": 2.3490229246921864e-05}, "score": 4.928045442609513}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9875860527284601, "4": 0.012120008463895496, "3": 0.00020891460040622733, "1": 7.939271059769425e-05, "2": 0}, "score": 4.9871445190973045}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9942053713008693, "4": 0.005499299821662353, "3": 0.00017048470022804145, "1": 0.00012240479669123783, "2": 0}, "score": 4.993670096150073}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9668924016390849, "4": 0.03146321478957706, "3": 0.0014546319000824676, "1": 0.00017900317765831493, "2": 6.136095071302732e-06}, "score": 4.964892938486654}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8399485827753269, "4": 0.12497454530209799, "3": 0.031524769777900266, "1": 0.0032174620932277215, "2": 0.00028255848563749265}, "score": 4.798247883746158}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9429761597041671, "4": 0.046698221432019446, "3": 0.008682680366450434, "1": 0.0015872282864315662, "2": 4.757652931258616e-05}, "score": 4.929444201223013}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9883519262507592, "4": 0.01126867304611152, "3": 0.00030316995564090413, "1": 7.420381455613585e-05, "2": 0}, "score": 4.987828147112853}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9873886757297299, "4": 0.011954641093236514, "3": 0.00034092160652457096, "1": 0.00031175342097750704, "2": 0}, "score": 4.986116446362446}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9109483857711053, "4": 0.051268825581124416, "1": 0.022833523361847942, "3": 0.014807955631018084, "2": 0.00013603613622302111}, "score": 4.8273721509445915}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9980253794334295, "4": 0.0016952077148900205, "3": 0.0001887600360731884, "1": 8.991309187532754e-05, "2": 0}, "score": 4.9975676180461726}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9964982537641152, "4": 0.002817447347193829, "3": 0.0003633632991809865, "1": 0.000317314868828096, "2": 0}, "score": 4.99518654915097}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9914252368004658, "4": 0.007581900387489128, "3": 0.0005683248407433451, "1": 0.0004191083833550803, "2": 3.2094467105289047e-06}, "score": 4.989595364957712}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9711347187875125, "4": 0.02421483783576196, "3": 0.00251055533827982, "1": 0.0021144101378834214, "2": 2.166730750543976e-05}, "score": 4.962241265130455}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9699869889774293, "4": 0.02757473290550245, "3": 0.001893984439373288, "1": 0.0005285969636214745, "2": 1.0502691503310852e-05}, "score": 4.966491228241438}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9758069668469408, "4": 0.02353699124240924, "3": 0.0005101582429901802, "1": 0.00014124988529625018, "2": 0}, "score": 4.9748775763185815}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9924762448174267, "4": 0.006987412241051283, "3": 0.0004120798568875025, "1": 0.00011957270040329295, "2": 0}, "score": 4.991710098360737}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9731812447411449, "4": 0.025095284977307234, "3": 0.0014937732164678201, "1": 0.00020885715678997478, "2": 0}, "score": 4.97108113729615}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9946866112528104, "4": 0.005033182958854137, "3": 0.00015215329889444232, "1": 0.00012510789912485, "2": 0}, "score": 4.994162061656521}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9807576144671039, "4": 0.017878328463291265, "3": 0.0011901975229030204, "1": 0.00016453323034227855, "2": 4.750507991771008e-06}, "score": 4.979068796268381}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.998580654924347, "4": 0.0013329296698235626, "1": 4.530421425004369e-05, "3": 4.036162906252333e-05, "2": 0}, "score": 4.998405129019595}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9543394463848297, "4": 0.04260601663995233, "3": 0.0024131845830740973, "1": 0.0006342832098727054, "2": 4.383583576247279e-06}, "score": 4.950017196369928}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903929395148751, "4": 0.008794726486724103, "3": 0.0004819863807588048, "1": 0.00032748542752035573, "2": 1.3814981938045112e-06}, "score": 4.988927198151688}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975533824594368, "4": 0.0021709719684156388, "1": 0.00021381636902061078, "3": 6.114154328488433e-05, "2": 0}, "score": 4.996851477303819}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9888689981804138, "4": 0.010651953248798965, "3": 0.0003896771430582987, "1": 8.531689989961357e-05, "2": 0}, "score": 4.988227377133059}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9805311993648633, "4": 0.018305897560268503, "3": 0.0009678721072750658, "1": 0.00019106574012519307, "2": 0}, "score": 4.97899401197116}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9412003342474079, "4": 0.05195340602829782, "3": 0.0061726656520309075, "1": 0.0006445739513268963, "2": 2.2483743972202533e-05}, "score": 4.933055078053171}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9734744149745929, "4": 0.02405347024279184, "3": 0.0020315992260360907, "1": 0.00042950894079697233, "2": 6.311204576666362e-06}, "score": 4.970146221752453}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9981391379547138, "4": 0.0018042422165037446, "3": 2.1032514670624845e-05, "1": 5.136631723585037e-06, "2": 0}, "score": 4.998133089378558}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9394601051004076, "4": 0.05229020031197957, "3": 0.007814802401072615, "1": 0.0004083319954940606, "2": 2.206312268469817e-05}, "score": 4.930380364451585}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9506961911394566, "4": 0.042881546375858746, "3": 0.005987962948914062, "1": 0.00038243838600985947, "2": 2.6456782640502277e-05}, "score": 4.94353196929977}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9349371137282745, "4": 0.058424818798486294, "3": 0.006333307927115068, "1": 0.0002611783632349952, "2": 2.1326310772590427e-05}, "score": 4.9277982661216715}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9841188979297184, "4": 0.015042100640009834, "3": 0.0006665042778410114, "1": 0.00015305365680196007, "2": 0}, "score": 4.983012345877722}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9362469049037162, "4": 0.056766949364326316, "3": 0.0064326261670596754, "1": 0.0005048590381650675, "2": 3.375054475118986e-05}, "score": 4.928246040664399}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9708443084490177, "4": 0.027483798318016932, "3": 0.0013971979671196265, "1": 0.0002651250384641858, "2": 5.409283033735402e-06}, "score": 4.968644947278157}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.895571206257923, "4": 0.09436640013144987, "3": 0.009444884564186158, "1": 0.0005820809677871038, "2": 2.8660204506000987e-05}, "score": 4.884328743407004}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8914308237807906, "4": 0.09780834288569266, "3": 0.010131248708065997, "1": 0.0005916161669496029, "2": 3.240570728198988e-05}, "score": 4.879464807401241}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9783828953783316, "4": 0.020781119933181914, "3": 0.0005824012003752762, "1": 0.0002465209692865552, "2": 0}, "score": 4.977067831830052}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9687139382884647, "4": 0.027491044002192787, "1": 0.002711789038753174, "3": 0.0010726618601439749, "2": 5.771393493095217e-06}, "score": 4.95949896772269}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9906563467600984, "4": 0.009008637857306205, "3": 0.00026770417814374873, "1": 6.544254341885611e-05, "2": 8.26860366159572e-07}, "score": 4.990191692813331}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9845759402716702, "4": 0.013938144342198854, "3": 0.0011159071694267963, "1": 0.0003634842829599166, "2": 4.176570929059538e-06}, "score": 4.982363533075134}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9949402604248736, "4": 0.0043829818436593795, "3": 0.000445248502090022, "1": 0.0002297405337433894, "2": 1.1233705188299721e-06}, "score": 4.993804184907315}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941053530083421, "4": 0.005415231217471814, "1": 0.0002806113337459185, "3": 0.0001968812111861502, "2": 1.087192361478658e-06}, "score": 4.993065293650417}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9952817669976958, "4": 0.004424255337475847, "1": 0.00016151072642739802, "3": 0.0001312104546233165, "2": 0}, "score": 4.994667274147085}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9529145381517172, "4": 0.04172145809148302, "3": 0.004394206544910928, "1": 0.0009507480140335511, "2": 1.7454867646345767e-05}, "score": 4.945634685483359}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9737545550156568, "4": 0.022879336774938627, "3": 0.002589374340052831, "1": 0.0007634812435592082, "2": 1.0338094398677612e-05}, "score": 4.968856884519935}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9761278590736268, "4": 0.023155047214237497, "3": 0.0006394948436973562, "1": 7.387131241737188e-05, "2": 0}, "score": 4.975270385667676}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9644770419290035, "4": 0.0333011049787907, "3": 0.0019060376891403676, "1": 0.00030330095335521004, "2": 6.759653003973647e-06}, "score": 4.961653116191976}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9768751541571352, "4": 0.021582762830147182, "3": 0.0013170867354990526, "1": 0.00022039173089821387, "2": 3.3455816269253935e-06}, "score": 4.974891428419577}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9813471131179319, "4": 0.01736208800841844, "3": 0.0011385599691756043, "1": 0.0001447199590264792, "2": 0}, "score": 4.979781760197283}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.997389350288549, "4": 0.002414997082386168, "1": 0.00013553617216811251, "3": 5.37953244880291e-05, "2": 0}, "score": 4.996935248207263}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9901088830721655, "4": 0.00940481487595707, "3": 0.00033784488092412587, "1": 0.00014590993648369, "2": 0}, "score": 4.989335828452114}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9919586788003156, "4": 0.007698367389046834, "3": 0.0002153723860345101, "1": 0.00012518386267222284, "2": 0}, "score": 4.991370131697552}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9923393381931744, "4": 0.007256381430149523, "1": 0.0002812985491901197, "3": 0.00011864128845336507, "2": 0}, "score": 4.99138110438553}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.99378160425043, "4": 0.005902605590794144, "3": 0.00015781690910526985, "1": 0.00015398613377909674, "2": 0}, "score": 4.993165788807087}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9676829754958196, "4": 0.030055325872833997, "3": 0.002065178738790316, "1": 0.00018350364993748012, "2": 7.334194267876141e-06}, "score": 4.965058100925471}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9183560220150074, "4": 0.06774009697614615, "3": 0.013075504299807406, "1": 0.0007549662588339869, "2": 6.336290261711006e-05}, "score": 4.902897965043736}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9889146914114323, "4": 0.010672108746194302, "3": 0.00034132088889943067, "1": 6.611287826852257e-05, "2": 0}, "score": 4.988380730965354}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9767840423300843, "4": 0.022168757525013703, "3": 0.0006580770080343414, "1": 0.00038086940904680445, "2": 0}, "score": 4.97499140440859}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9802149672847287, "4": 0.017384018010320235, "3": 0.001435314198613203, "1": 0.0009553980481278312, "2": 8.108748641128866e-06}, "score": 4.975899382284263}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9971436936274373, "4": 0.0023188138397960776, "1": 0.00042116848602810435, "3": 0.00011360761732590689, "2": 0}, "score": 4.9957692854890015}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.99868764888687, "4": 0.0008616925684887226, "1": 0.0003890699929767085, "3": 5.976950361986835e-05, "2": 0}, "score": 4.997462483836501}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9976666828264203, "4": 0.0021080329868808623, "1": 0.0001499706424534628, "3": 7.449638181498136e-05, "2": 4.864226211876325e-07}, "score": 4.997141631466436}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9941763856658091, "4": 0.005359717556342833, "1": 0.00027912244540496847, "3": 0.00018281222953607116, "2": 1.1260619635107262e-06}, "score": 4.993154784294194}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9518295103455732, "4": 0.044005141483183165, "3": 0.00352276002008581, "1": 0.0006187812749407251, "2": 1.890337652005987e-05}, "score": 4.946417240504276}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9935331310852917, "4": 0.00598146355096341, "3": 0.0003486097696094894, "1": 0.00013291695809120778, "2": 0}, "score": 4.992789621111017}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9961613537115266, "4": 0.0037081706879092432, "3": 0.00010955421687129989, "1": 1.9378448722191596e-05, "2": 0}, "score": 4.995995200904313}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9866485509740207, "4": 0.01277917993413061, "3": 0.00047996445926576164, "1": 8.847097728650836e-05, "2": 0}, "score": 4.985906953210308}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9857565130929695, "4": 0.013793907083557018, "3": 0.000361328153524443, "1": 8.473074797888952e-05, "2": 0}, "score": 4.985144461312286}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9715715732013224, "4": 0.024599577770301542, "3": 0.0033830080826176565, "1": 0.00041863325823399605, "2": 1.7280514858156906e-05}, "score": 4.966907702974007}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9744364081876, "4": 0.024657997226857326, "3": 0.0007699884832858667, "1": 0.00012365588142808131, "2": 0}, "score": 4.973307083294609}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9853922339673418, "4": 0.012174337819922306, "3": 0.0022388162782554784, "1": 0.0001853145326617517, "2": 4.656055162450365e-06}, "score": 4.982592722534223}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960867199150024, "4": 0.0037260279704519946, "3": 0.00014240719978166836, "1": 4.3613623099634034e-05, "2": 0}, "score": 4.995814697984259}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9942797440245724, "4": 0.005396660190458482, "3": 0.00027453604339667533, "1": 4.770120015043583e-05, "2": 0}, "score": 4.993863454585396}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9705881995276324, "4": 0.02354460198188765, "3": 0.004175240573267083, "1": 0.0016700299810334177, "2": 1.9273431821169873e-05}, "score": 4.961366874100181}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999267474727732, "4": 0.0006090647342051624, "1": 0.00010331241552998152, "3": 1.96295593050849e-05, "2": 0}, "score": 4.998938425934571}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9919451897419377, "4": 0.00712826080983488, "3": 0.0007778906471712534, "1": 0.0001464457507695751, "2": 1.3940616797670842e-06}, "score": 4.990725985112393}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970172477709265, "4": 0.002849137391968409, "3": 8.351377246566161e-05, "1": 4.960350804602676e-05, "2": 0}, "score": 4.996785419431481}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9960392903828953, "4": 0.003858416163679836, "3": 8.287185988084302e-05, "1": 1.8596558895110384e-05, "2": 0}, "score": 4.995901450499533}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.801004423065148, "4": 0.19219707520836474, "3": 0.006623916948140814, "1": 0.00015827350138565184, "2": 1.3005086601411221e-05}, "score": 4.793882300165655}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9814925997786051, "4": 0.0180556684852578, "1": 0.00023912479201008765, "3": 0.0002077645688193234, "2": 0}, "score": 4.980572209132409}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9410168528932609, "4": 0.05575231749995374, "3": 0.00296547427939737, "1": 0.00024707713071036566, "2": 0}, "score": 4.937327279874105}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9531255558496621, "4": 0.046372373304170475, "3": 0.00045992597745776113, "1": 3.745894592595487e-05, "2": 0}, "score": 4.952557716646334}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9646163417619977, "4": 0.034580788388966506, "3": 0.0006621838642706087, "1": 0.0001311295227428665, "2": 0}, "score": 4.963569977649396}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9964271104141412, "4": 0.003511501693825804, "3": 3.791743595818748e-05, "1": 1.948154404111711e-05, "2": 0}, "score": 4.9963347226376245}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9977560365587099, "4": 0.00218439800714281, "3": 3.7329897904000035e-05, "1": 2.0951820877065398e-05, "2": 0}, "score": 4.9976571319059655}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9951331274911267, "4": 0.0046694144528096546, "3": 0.00015026862983336263, "1": 4.522796354132929e-05, "2": 0}, "score": 4.994849126330111}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9949616174447574, "4": 0.004809471866294514, "1": 0.00011777459171932163, "3": 0.00010703207522136214, "2": 0}, "score": 4.9945053430661925}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9939385576156651, "4": 0.005904542553429827, "3": 0.00012113147887739247, "1": 3.4361321540158416e-05, "2": 0}, "score": 4.99371574036051}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"5": 0.988284394470888, "4": 0.011354482262690117, "3": 0.00031915330202666526, "1": 4.009920697627675e-05, "2": 0}, "score": 4.9878467915696465}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9954679125436262, "4": 0.004378009981332434, "3": 0.0001423851283762804, "1": 1.0716049361030648e-05, "2": 0}, "score": 4.995294350970359}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984092781413373, "4": 0.0015229473128316171, "3": 5.664561378808647e-05, "1": 9.769678493246737e-06, "2": 0}, "score": 4.998324680468436}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972278599959747, "4": 0.0026900002296409774, "1": 4.37422107942519e-05, "3": 3.685559938964398e-05, "2": 0}, "score": 4.997061315197056}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9985955160120935, "4": 0.0013546227184356371, "1": 2.5544922220230145e-05, "3": 2.3585675513037253e-05, "2": 0}, "score": 4.998496025142745}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9212872058734352, "4": 0.07146401805056515, "3": 0.006296313346288078, "1": 0.00091767560615066, "2": 3.183656773710828e-05}, "score": 4.912176884002039}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9993244891202749, "4": 0.0006380607881029664, "1": 2.7325478844808802e-05, "3": 9.442087205205675e-06, "2": 0}, "score": 4.999233752599125}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9928816354344328, "4": 0.006709277559764239, "3": 0.00030979523840486353, "1": 9.752137238826018e-05, "2": 0}, "score": 4.992281032808252}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9802315761878446, "4": 0.0185234052106452, "3": 0.0009278003392470057, "1": 0.00031107173911199107, "2": 4.065726947823333e-06}, "score": 4.97836446495443}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9813125703075072, "4": 0.01791258751760511, "3": 0.0006648095162965439, "1": 0.00010579841708938121, "2": 0}, "score": 4.980334516513038}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9791724958568954, "4": 0.017803564302790377, "3": 0.0019038268250109746, "1": 0.0011089873248832577, "2": 9.688460691953482e-06}, "score": 4.9739237298879875}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999269008604483, "4": 0.0006473697130525278, "3": 6.355143372506857e-05, "1": 1.9568841031525984e-05, "2": 0}, "score": 4.999147251627797}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983615125885531, "4": 0.001585228528543108, "3": 3.955628356043844e-05, "1": 1.3295432536851106e-05, "2": 0}, "score": 4.99828247647487}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992406885229708, "4": 0.0007320468817113986, "1": 1.3780196950386777e-05, "3": 1.2799390568603916e-05, "2": 0}, "score": 4.999187232992598}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9974644184311988, "4": 0.002399109625108513, "3": 6.861681065316117e-05, "1": 6.60422413638059e-05, "2": 0}, "score": 4.997199482711097}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7754732041194292, "4": 0.19744650343816952, "3": 0.025942508521719383, "1": 0.0010610842672768407, "2": 7.107431771363882e-05}, "score": 4.746209491839339}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9355155886170855, "4": 0.06078717802479781, "3": 0.003395144351581913, "1": 0.0002783239040555834, "2": 1.4662094499282661e-05}, "score": 4.931264625673657}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8573765717092691, "4": 0.13390552031335312, "3": 0.007955734417164583, "1": 0.000704438166371405, "2": 4.0132984726988246e-05}, "score": 4.8472421703268385}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8867344016091574, "4": 0.10570311672734824, "3": 0.005468454191600878, "1": 0.002051656014469361, "2": 3.4466180157867945e-05}, "score": 4.875048964518518}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8730070915322357, "4": 0.12030993189694413, "3": 0.005748609382179247, "1": 0.0008949425783641445, "2": 3.131789182283598e-05}, "score": 4.864518027035561}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9889052488045827, "4": 0.010604014745459264, "3": 0.0003174126168601194, "1": 0.00016824303281744366, "2": 0}, "score": 4.988088127367705}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9965469116698176, "4": 0.0033049861377964737, "3": 0.00010837924002327968, "1": 3.85821817794663e-05, "2": 0}, "score": 4.996323922461478}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9922799438965513, "4": 0.006849785096320955, "3": 0.00046451082284155586, "1": 0.00040101889983911723, "2": 0}, "score": 4.9906170731715145}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9863951771391977, "4": 0.012848895816628896, "3": 0.000502391430540973, "1": 0.00024701932142572936, "2": 0}, "score": 4.985158147322737}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.985974560916362, "4": 0.013358577381019865, "1": 0.0003364153502369599, "3": 0.00032603983200402625, "2": 0}, "score": 4.984643613885795}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.973086415768863, "4": 0.02564574777142527, "3": 0.001034421133531938, "1": 0.00022575730666760753, "2": 0}, "score": 4.971382161578875}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9795633224095275, "4": 0.01904282669054957, "3": 0.0011843016535644257, "1": 0.00019836654526264933, "2": 6.6244447561283236e-06}, "score": 4.977775129180345}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9843991676559305, "4": 0.013841125636262473, "3": 0.0011617474325343916, "1": 0.0005852371548359176, "2": 6.162802084498377e-06}, "score": 4.981475820967084}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9872527177207229, "4": 0.011237678443751448, "3": 0.0009534415836323617, "1": 0.000534983314181731, "2": 0}, "score": 4.984715181416036}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9863019341580817, "4": 0.012140855819442967, "3": 0.0012681463647690517, "1": 0.00028085051647964597, "2": 6.221080204332697e-06}, "score": 4.984180754631585}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9785391291832135, "4": 0.02032381353324964, "3": 0.0010255454106087541, "1": 0.00010806269392057412, "2": 1.5045721287773544e-06}, "score": 4.97718828679365}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9934905293973686, "4": 0.006220954048437525, "3": 0.00017414278357418794, "1": 0.00010894634986284498, "2": 0}, "score": 4.992994936965538}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9458297106667444, "4": 0.04543906869717008, "3": 0.005752159094256778, "1": 0.002945658168767516, "2": 3.062784486079483e-05}, "score": 4.931181905898105}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9702231426225358, "4": 0.027663002731915663, "3": 0.0014881195545485963, "1": 0.0006163084433654189, "2": 4.6284524027833155e-06}, "score": 4.966881480119192}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.983453312546677, "4": 0.014448466422307417, "3": 0.0015078854105236466, "1": 0.0005783571346985006, "2": 8.481620752065258e-06}, "score": 4.980196820106547}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9813306992433874, "4": 0.017756275078266492, "3": 0.0005957877967617534, "1": 0.000313764140252491, "2": 0}, "score": 4.979797022587282}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9908797362202348, "4": 0.00838283178276314, "3": 0.0005678995519730126, "1": 0.00016679434024503384, "2": 1.8012017084732236e-06}, "score": 4.989808778598999}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9884772300376992, "4": 0.010864471596548715, "3": 0.0005347256747767222, "1": 0.00012012844651663352, "2": 0}, "score": 4.987585520509329}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963178828800312, "4": 0.0035084462616711185, "1": 0.00010760849107646918, "3": 6.471846519725133e-05, "2": 0}, "score": 4.995931677376201}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9943574085581856, "4": 0.005486331838792232, "3": 0.00012708085761027464, "1": 2.7703245100225718e-05, "2": 0}, "score": 4.994148684831969}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9761301315019278, "4": 0.021150344187110887, "3": 0.0025857297735833317, "1": 0.00013081728229914026, "2": 2.168341431353383e-06}, "score": 4.973148400391607}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9821933754536224, "4": 0.017039684040109023, "3": 0.0006558463624712785, "1": 0.00010826723380628907, "2": 1.645235537674718e-06}, "score": 4.981210596390151}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9753871440261356, "4": 0.022176994748403754, "3": 0.0020656238327656775, "1": 0.000363067133509988, "2": 5.558179118573325e-06}, "score": 4.972222769735549}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987874062866239, "4": 0.00115923728853721, "1": 3.015203925791268e-05, "3": 2.176413775220467e-05, "2": 0}, "score": 4.998676624372937}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9988192780013886, "4": 0.0011484791386461018, "1": 1.732953996802901e-05, "3": 1.404355480745461e-05, "2": 0}, "score": 4.998754114508239}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9084836572730542, "4": 0.0850087913664094, "3": 0.005850378025982935, "1": 0.0006344273988327637, "2": 1.6292673984298404e-05}, "score": 4.900703224176256}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9718074858142747, "4": 0.025874164959861657, "3": 0.0017844989561285832, "1": 0.000512343274281493, "2": 1.2670146512054754e-05}, "score": 4.968469174958082}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9580851364635733, "4": 0.03849754907901982, "3": 0.002772457965724609, "1": 0.0006238699654579307, "2": 1.293751923728356e-05}, "score": 4.953422867670324}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9759534123073148, "4": 0.02228355759620796, "1": 0.0010753472997966182, "3": 0.000674961031411823, "2": 0}, "score": 4.972064775756416}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9283089233974214, "4": 0.067070343994226, "3": 0.003096007192804771, "1": 0.001498414095266954, "2": 1.807112856745871e-05}, "score": 4.920689118316524}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9252399543523946, "4": 0.07223703604446106, "3": 0.002430459365973806, "1": 7.585749830768014e-05, "2": 0}, "score": 4.922597323167689}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9507155912438715, "4": 0.04822081522525896, "3": 0.0009905604142456939, "1": 6.323775790494497e-05, "2": 0}, "score": 4.94954461868607}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9478929813223703, "4": 0.051224773834808, "3": 0.0006543749845171426, "1": 0.00021555445261300533, "2": 0}, "score": 4.946603600787387}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963566923096864, "4": 0.0035736760753433986, "3": 4.498569534280117e-05, "1": 2.262798824438064e-05, "2": 0}, "score": 4.996245833005341}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970831246713965, "4": 0.002845811542168971, "3": 5.233972055027749e-05, "1": 1.7086788421500624e-05, "2": 0}, "score": 4.99698115692036}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9938109232278007, "4": 0.006020901379837133, "3": 0.000113466377319452, "1": 5.284608108780225e-05, "2": 0}, "score": 4.993540769508053}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9810046552649009, "4": 0.018087629995773406, "3": 0.0008368388825254699, "1": 6.702713637832403e-05, "2": 0}, "score": 4.979970506605741}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9900654152760623, "4": 0.008664332437849446, "3": 0.0007693846641997334, "1": 0.0004973701701228468, "2": 2.3054331075787805e-06}, "score": 4.987800486711889}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9836029927453548, "4": 0.01535348799219563, "3": 0.0008192108984463567, "1": 0.00021617787365883615, "2": 0}, "score": 4.982143233532009}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9915664525788987, "4": 0.007754809867983247, "3": 0.0004111588178425069, "1": 0.00026390720838311954, "2": 0}, "score": 4.990367208295745}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9665699832551556, "4": 0.030239365803415453, "3": 0.002160303625075756, "1": 0.0010040002587434838, "2": 2.015193992524376e-05}, "score": 4.961363330732969}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994699581056091, "4": 0.00418481827049115, "1": 0.0008764972421873545, "3": 0.00023337732351696113, "2": 2.8556416330042732e-06}, "score": 4.991833847748164}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918709449271783, "4": 0.006126066593483292, "3": 9.086533342346406e-05, "1": 8.178031428341557e-05, "2": 0}, "score": 4.993352915038225}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.995766520247287, "4": 0.0034533258424360915, "1": 0.0005128913133781267, "3": 0.00026382857575186515, "2": 1.785632256725774e-06}, "score": 4.993962084902945}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9944863754315042, "4": 0.005240900207918674, "3": 0.00013953333844311165, "1": 0.00013183624153289625, "2": 0}, "score": 4.993952679956272}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9831054754981101, "4": 0.0142053915474136, "3": 0.0018043686983162562, "1": 0.0008688199033800434, "2": 1.1188210141977082e-05}, "score": 4.978676925396424}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9359605694948142, "4": 0.059108567436021484, "3": 0.004565975941236504, "1": 0.00034566170237690185, "2": 1.665821616312537e-05}, "score": 4.930326680357508}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9699486286905304, "4": 0.0268490376602782, "3": 0.0026641212848346448, "1": 0.0005198222665033263, "2": 1.1289053709632204e-05}, "score": 4.965709320043278}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9931224957303748, "4": 0.006680639249361188, "3": 0.00011274927610013646, "1": 8.295966766647306e-05, "2": 0}, "score": 4.992762015160108}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9784916535734639, "4": 0.020771222165481218, "3": 0.0006508300563427349, "1": 8.387759703435534e-05, "2": 1.8770897234199245e-06}, "score": 4.977585963971752}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9187627738881649, "4": 0.06160119557167009, "3": 0.01566292224726933, "1": 0.0038618895289766145, "2": 0.00010677561302231308}, "score": 4.891304592028718}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9876523358030392, "4": 0.010524851592375428, "3": 0.0013311390163258318, "1": 0.0004843799202368107, "2": 4.775962660776056e-06}, "score": 4.984860984690463}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9701437069143104, "4": 0.024463927337023322, "3": 0.004127468557526401, "1": 0.001236503673650423, "2": 2.1665075887697e-05}, "score": 4.962269871760693}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9942745541961373, "4": 0.005142877146457225, "3": 0.00031803249336852257, "1": 0.0002611801914899367, "2": 1.834490081162462e-06}, "score": 4.9931708232401295}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9861602423378768, "4": 0.012195685955288716, "3": 0.0011288803253599355, "1": 0.0005088072483850685, "2": 4.803801376704558e-06}, "score": 4.983496886915928}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9368850622089016, "4": 0.05864831699686552, "3": 0.004103954327304641, "1": 0.0003238387018268868, "2": 2.7738700219424396e-05}, "score": 4.931764446772083}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9626426192047538, "4": 0.03268678209745291, "3": 0.0037004324047930207, "1": 0.0009438005461507796, "2": 1.625810506993891e-05}, "score": 4.956087932745703}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9728177243539504, "4": 0.02318819884965446, "3": 0.0038882165380184786, "1": 9.656289502565566e-05, "2": 5.563467461123398e-06}, "score": 4.96863230896813}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9926878845540721, "4": 0.006865406693013602, "3": 0.0002231458420600169, "1": 0.00021916690393234678, "2": 0}, "score": 4.991811598010865}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9965129323911515, "4": 0.0033164909426464362, "3": 0.00011499567948528007, "1": 5.234725801272094e-05, "2": 0}, "score": 4.996244116520824}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9815422115573815, "4": 0.01702423605340564, "3": 0.0012728762187433215, "1": 0.000157030814684339, "2": 2.6907785027329523e-06}, "score": 4.97979379662648}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9936829569438823, "4": 0.006161444698235409, "3": 0.0001317530791049943, "1": 2.2020185556049478e-05, "2": 0}, "score": 4.993486956514418}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9893271058587038, "4": 0.010228063634244045, "3": 0.00032074344216281983, "1": 0.0001216847346625229, "2": 0}, "score": 4.988643683261157}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9859518502398859, "4": 0.012799394677437593, "3": 0.000980394025764837, "1": 0.00026440144098042144, "2": 2.1653858298195063e-06}, "score": 4.984175686957163}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9857775986502938, "4": 0.013770595789035153, "3": 0.00041288291664573734, "1": 3.5737106900949444e-05, "2": 0}, "score": 4.9852606429973}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7335562112849875, "4": 0.18000929329644233, "3": 0.061188904801056654, "1": 0.023297363018195946, "2": 0.0019390533285105623}, "score": 4.598602602514703}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9867684449367513, "4": 0.011674204672703256, "3": 0.001292916189412159, "1": 0.0002600678498582171, "2": 2.3463045487075566e-06}, "score": 4.984692621713773}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9921225787924295, "4": 0.007030593168335125, "3": 0.0007404673626311427, "1": 0.00010235811113484416, "2": 2.3096397453191933e-06}, "score": 4.991072095628349}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952782224075226, "4": 0.004504293166544673, "1": 0.00011061365650074899, "3": 0.00010255903232962382, "2": 0}, "score": 4.9948481119292065}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9830942976524, "4": 0.015104176258349531, "3": 0.0011831546210891082, "1": 0.0006031274642959954, "2": 0}, "score": 4.980116701541211}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9309984747486696, "4": 0.06588329893615154, "3": 0.0028748393055979373, "1": 0.0002298319886741434, "2": 7.0271664417660015e-06}, "score": 4.927426139247029}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9885082217558853, "4": 0.010988917654427685, "3": 0.00040890733188548705, "1": 9.094251084872186e-05, "2": 0}, "score": 4.987829460995993}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9723718499527264, "4": 0.026068390254228038, "3": 0.001444013340472233, "1": 0.00011180771415792297, "2": 0}, "score": 4.970596236394462}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9907154282943553, "4": 0.008875949175386559, "3": 0.0002071620957258028, "1": 0.00019790627458937207, "2": 0}, "score": 4.989918065701998}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9638987567550774, "4": 0.03451554764786819, "3": 0.0012763880830238524, "1": 0.00029799823329998014, "2": 0}, "score": 4.961739250551327}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"5": 0.917251234387033, "4": 0.0704416338996944, "3": 0.011436635910994013, "1": 0.0008046107000028791, "2": 5.970904747817243e-05}, "score": 4.903286927030633}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9850431467128642, "4": 0.01382597789859068, "3": 0.0010372498949797876, "1": 8.87538278353224e-05, "2": 2.742662209402717e-06}, "score": 4.983736244387887}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9753048111708316, "4": 0.021548889394037006, "3": 0.002503592947152743, "1": 0.0006268432804561598, "2": 9.76626947036169e-06}, "score": 4.970907075403664}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9893064494190459, "4": 0.009858939223289778, "3": 0.0006663767211297991, "1": 0.00016148311045441195, "2": 3.262195901265149e-06}, "score": 4.988152546965255}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9916506168406445, "4": 0.007978486876286184, "3": 0.00028459427171665416, "1": 8.452307364397814e-05, "2": 0}, "score": 4.99111421647845}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9344474097697006, "4": 0.054783353468404364, "3": 0.006672406430090711, "1": 0.003981769342721074, "2": 0.00010843832280768857}, "score": 4.915618882504124}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9909189490799164, "4": 0.008086081731789188, "3": 0.000689744306045432, "1": 0.00030066796752478887, "2": 2.1483939391897665e-06}, "score": 4.989325286893935}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9957879174085866, "4": 0.0039872839267032735, "3": 0.00012283777199639608, "1": 9.996474341421378e-05, "2": 0}, "score": 4.995367172307832}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967604113280797, "4": 0.003178811163641758, "1": 3.137111477665121e-05, "3": 2.8260400749646474e-05, "2": 0}, "score": 4.996639179724277}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955426934086926, "4": 0.00418913797543745, "1": 0.00017725857778739753, "3": 8.902939160477391e-05, "2": 0}, "score": 4.994923759383589}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9212946904410979, "4": 0.07214817417804928, "3": 0.006019273548196777, "1": 0.0005216159337420806, "2": 1.3042973478079403e-05}, "score": 4.9136874096173635}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.970263314573167, "4": 0.028632704513870615, "3": 0.0010157033000337751, "1": 8.544779100956165e-05, "2": 0}, "score": 4.968994009980593}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9116583183855708, "4": 0.08296497899885534, "3": 0.004951184688631377, "1": 0.0004013502782908439, "2": 1.6650105586939502e-05}, "score": 4.90547658961015}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975370131417594, "4": 0.0023706620899536287, "3": 4.703417936589479e-05, "1": 4.4602662652124197e-05, "2": 0}, "score": 4.997356857082418}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9197912379131676, "4": 0.07834293394625924, "3": 0.0015794796841627646, "1": 0.0002793965385743525, "2": 3.6665551057552407e-06}, "score": 4.917369249393811}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9162384652009512, "4": 0.062173028418031975, "3": 0.019823047560866808, "1": 0.001666215153197283, "2": 9.341375068104591e-05}, "score": 4.891235140505378}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9787076500877391, "4": 0.01912395387714201, "3": 0.002086904523785314, "1": 7.766304694586505e-05, "2": 2.6855070564314804e-06}, "score": 4.976383501373684}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8728941753679563, "4": 0.10472266593081885, "3": 0.019620663654681274, "1": 0.002674242811032069, "2": 7.904683761336723e-05}, "score": 4.845100469091034}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9923918158741876, "4": 0.007176171179964885, "3": 0.00035257929875668936, "1": 7.495624609975503e-05, "2": 0}, "score": 4.991818808607648}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9843962794330096, "4": 0.01454348284705441, "3": 0.0009777297063529428, "1": 7.799077558491582e-05, "2": 0}, "score": 4.983189018698696}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6392047713454301, "4": 0.19406201617452334, "3": 0.12002835169272717, "1": 0.043744823201611174, "2": 0.0029270848001426587}, "score": 4.382100371719198}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999376395122396, "4": 0.0005921361301126467, "3": 2.1376422406973704e-05, "1": 9.681487510901701e-06, "2": 0}, "score": 4.999326384798284}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987990632024664, "4": 0.0008539388251972313, "3": 0.00018285226979858818, "1": 0.00016222829278838606, "2": 0}, "score": 4.9981314398812575}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972097200875749, "4": 0.0025414672684287752, "3": 0.00014715324959123794, "1": 0.00010001233795868178, "2": 9.3446375149551e-07}, "score": 4.996761371181478}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9835204237235587, "4": 0.013881055251891955, "3": 0.0018809199250200235, "1": 0.0007001597742759911, "2": 1.4544305725789223e-05}, "score": 4.979512773531892}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9800105579080408, "4": 0.017349747951254626, "3": 0.002467605578333908, "1": 0.0001611332331669228, "2": 0}, "score": 4.977070256756524}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9767443505402035, "4": 0.021068222845019982, "3": 0.001726344693003969, "1": 0.00043984947141743744, "2": 0}, "score": 4.973719131876075}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.959762370394627, "4": 0.03787042555017254, "3": 0.0019763135758795653, "1": 0.0003826943228914411, "2": 0}, "score": 4.956645814668819}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9929134846094629, "4": 0.0065515586225577595, "3": 0.00032933272369986474, "1": 0.00020014389001927867, "2": 0}, "score": 4.991989156469307}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9471632539489782, "4": 0.05056016832177731, "3": 0.002046457560188171, "1": 0.0002231648102627293, "2": 0}, "score": 4.944453870973538}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9762073728067392, "4": 0.02281606011454094, "3": 0.0006724238413260682, "1": 0.00029776707637142735, "2": 3.4672561904682355e-06}, "score": 4.974637548351792}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.99398685177857, "4": 0.005763588469961402, "1": 0.00014588863518799565, "3": 9.870548901012631e-05, "2": 0}, "score": 4.993455413513289}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918484257448834, "4": 0.007535711691027194, "3": 0.00033779410665430506, "1": 0.000272063245085464, "2": 0}, "score": 4.990700391269197}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9741868860018311, "4": 0.02504295070590747, "3": 0.0006195689894376536, "1": 0.00014467452409300258, "2": 0}, "score": 4.97313905420799}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9809592397246677, "4": 0.018453264250472143, "3": 0.00033550322133634125, "1": 0.00023963107615194206, "2": 0}, "score": 4.9799169567411425}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9777481416378196, "4": 0.020501115083500384, "3": 0.0015155552583597481, "1": 0.000222709795385619, "2": 7.480544309317962e-06}, "score": 4.975554371413865}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9669992878326532, "4": 0.03149191288253858, "3": 0.0011882226022060258, "1": 0.00030644324224908125, "2": 0}, "score": 4.964905372936235}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9587981249935585, "4": 0.03875629828512757, "3": 0.0022874605657033, "1": 0.00014584210413546826, "2": 8.56423283466133e-06}, "score": 4.956059556457343}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986463952504614, "4": 0.001300807569599307, "1": 3.30024089723494e-05, "3": 1.8968601469663807e-05, "2": 0}, "score": 4.9985292443764795}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9956206842914123, "4": 0.004238172995029223, "3": 8.300290091461056e-05, "1": 5.514833517153049e-05, "2": 0}, "score": 4.995375214027512}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9257703104264715, "4": 0.06963662004070623, "3": 0.004095645265900998, "1": 0.0004813927947549286, "2": 1.1119669397771796e-05}, "score": 4.920212767341129}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9687898942511729, "4": 0.029591695927545368, "3": 0.001173702026815214, "1": 0.00042730915086178217, "2": 0}, "score": 4.966351077969775}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9100145104945176, "4": 0.0846020822321228, "3": 0.0050384237189159105, "1": 0.000332045350660996, "2": 9.212631743826747e-06}, "score": 4.90396489324646}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9892943111980298, "4": 0.01044770648269234, "3": 0.00018150560920974918, "1": 6.961050974083966e-05, "2": 0}, "score": 4.98891076411901}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9518517605722667, "4": 0.04669151604887984, "3": 0.0012794250265219444, "1": 0.0001694584150808996, "2": 0}, "score": 4.950071408800731}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.999423184721932, "4": 0.00057399073665881, "3": 2.393085548977164e-06, "1": 2.498090527299135e-07, "2": 0}, "score": 4.999420223750717}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997699073453761, "4": 0.00022861138607312303, "3": 1.0228139035563477e-06, "1": 1.1727232999902677e-07, "2": 0}, "score": 4.999768873817943}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997763428849825, "4": 0.00022147640452497026, "3": 1.5715518300385515e-06, "1": 2.82015021414402e-07, "2": 0}, "score": 4.999774252357878}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9802481883131287, "4": 0.019482017857859562, "3": 0.00025301064374078433, "1": 1.5911236503475147e-05, "2": 3.9063938169276547e-07}, "score": 4.979947134338866}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9892967666295573, "4": 0.010585152154067903, "3": 0.00010941112304203645, "1": 8.120717870511149e-06, "2": 0}, "score": 4.989163536775079}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9659982049511198, "4": 0.03033212187857193, "3": 0.002535537076200965, "1": 0.0011238275101585183, "2": 7.67108877689786e-06}, "score": 4.96007837536897}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9516343948269249, "4": 0.039698991286988096, "3": 0.0079714513589869, "1": 0.0006755428284386552, "2": 1.8193466715556468e-05}, "score": 4.941601270991004}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9577334649734062, "4": 0.037807238499257906, "3": 0.003873066920013133, "1": 0.0005702372817419019, "2": 1.2126917370415718e-05}, "score": 4.952129112741116}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9704618750184342, "4": 0.028901964800449, "3": 0.0005646293837595925, "1": 6.97209298836254e-05, "2": 0}, "score": 4.969689837855121}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9540943691324558, "4": 0.04133829371549072, "3": 0.0036160807695132303, "1": 0.0009340496151506532, "2": 1.1719645754470354e-05}, "score": 4.9476579001401495}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"5": 0.996544777068619, "4": 0.0032681062182110966, "1": 9.31297384383092e-05, "3": 8.983058953135589e-05, "2": 0}, "score": 4.996179697770326}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9624002062631953, "4": 0.03187352344087625, "3": 0.004136982175785739, "1": 0.0015457856292148073, "2": 2.7617774193424074e-05}, "score": 4.9535857790913616}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9876475674290728, "4": 0.011373143912348515, "3": 0.000759479293219932, "1": 0.00021492423226858803, "2": 2.2055999497935392e-06}, "score": 4.986241546906057}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.990431886492599, "4": 0.009232503796751512, "3": 0.0002704550898213815, "1": 5.534800183518125e-05, "2": 0}, "score": 4.990005096000049}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9791060984629018, "4": 0.020293314137813802, "3": 0.0005474509441576318, "1": 5.1305889874990695e-05, "2": 1.2217088286914175e-06}, "score": 4.978402882138341}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"5": 0.996760173899778, "4": 0.0029207159628497907, "3": 0.00018298525173180764, "1": 0.00013534465945206614, "2": 5.991714816009213e-07}, "score": 4.9961701366880185}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9863363744503082, "4": 0.012850678082075913, "3": 0.0007176362736016049, "1": 9.230077684210886e-05, "2": 2.3780327207814498e-06}, "score": 4.9853377028929815}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9980817665659336, "4": 0.0017785237726138752, "3": 7.822768069225092e-05, "1": 6.0865624545220974e-05, "2": 0}, "score": 4.997821557025123}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951922677213538, "4": 0.0041777715358586945, "1": 0.0003792568037057666, "3": 0.0002480158258311563, "2": 1.4080680083640157e-06}, "score": 4.993804937463671}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969659341092395, "4": 0.0028282860127825373, "1": 0.00013563121633389033, "3": 6.836914032366195e-05, "2": 0}, "score": 4.996492444599465}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9476562196462038, "5": 0.024030377976459873, "4": 0.011920134903514979, "3": 0.011665879265115725, "2": 0.004726143673611375}, "score": 1.1599400178711925}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9940331450110089, "4": 0.005792047633017259, "3": 0.00014044087166660332, "1": 3.0568790126363306e-05, "2": 0}, "score": 4.9938047719355625}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.986907754897409, "4": 0.012655031447524875, "3": 0.00034807259278042246, "1": 8.640335948343997e-05, "2": 0}, "score": 4.986303172431137}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.984545665026991, "4": 0.014384155366060386, "3": 0.0006576234860919785, "1": 0.0003986428718093664, "2": 0}, "score": 4.982705785555806}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9958718450546803, "4": 0.0039290720522571045, "1": 0.00015335408950093333, "3": 4.288126674544058e-05, "2": 0}, "score": 4.995371735877096}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9846015966857977, "4": 0.014323911576014328, "3": 0.0009300464749509937, "1": 0.0001411924082902986, "2": 2.476939085020149e-06}, "score": 4.983243782022253}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9876815203730952, "4": 0.010258976505650545, "1": 0.0011431870034316154, "3": 0.0009078497196991756, "2": 4.2541056757187684e-06}, "score": 4.983339743546325}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9929595613323349, "4": 0.005670628618088887, "1": 0.0006982104474495729, "3": 0.0006672792059579033, "2": 2.6833997606140027e-06}, "score": 4.990193904928374}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962090269507489, "4": 0.0034856456029644426, "3": 0.0001573548676116027, "1": 0.0001453249919165675, "2": 0}, "score": 4.9956183330933035}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9789368804729974, "4": 0.01755933432662958, "1": 0.002324028910722329, "3": 0.001167155951585233, "2": 1.1302190516669094e-05}, "score": 4.970776293619078}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9638256613006286, "4": 0.03422985029337004, "3": 0.001750901816615727, "1": 0.00018363122930288055, "2": 4.6842066262370516e-06}, "score": 4.961519565700034}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9792909251190491, "4": 0.019736448007451102, "3": 0.0006844899469837083, "1": 0.00026758628042215603, "2": 0}, "score": 4.977823771241064}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9440973784679849, "4": 0.05435719453644423, "3": 0.0013779863666737845, "1": 0.00015346431400765212, "2": 0}, "score": 4.9422721686518285}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9790326202865846, "4": 0.020070728878844944, "3": 0.0006027265178617039, "1": 0.00028166222179758926, "2": 0}, "score": 4.977596894489235}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9858640216173796, "4": 0.013178923895717086, "3": 0.0005508364041862469, "1": 0.00040135549587837595, "2": 2.7873172050275832e-06}, "score": 4.984105586375588}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9922918032011689, "4": 0.006717474590933868, "3": 0.0006812474194209087, "1": 0.0002925274644923341, "2": 0}, "score": 4.990749763945508}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9914434028515074, "4": 0.007877599921465698, "3": 0.00038840859210393026, "1": 0.00027191419527053645, "2": 0}, "score": 4.990257744182076}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984666757446773, "4": 0.0012657606919800276, "1": 0.00019883862338331007, "3": 6.419649139050699e-05, "2": 0}, "score": 4.997810481916585}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981821263375481, "4": 0.0016751279978463867, "1": 7.201875404630779e-05, "3": 6.583071731948197e-05, "2": 0}, "score": 4.997905125294419}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.994478828004695, "4": 0.004719070154298051, "1": 0.0005791481157883, "3": 0.00021245996231223534, "2": 0}, "score": 4.992539339167518}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9540225313933604, "4": 0.03948325977774645, "3": 0.005735338537870181, "1": 0.0007432664230974114, "2": 1.500579647261233e-05}, "score": 4.946027947785561}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9671020727482125, "4": 0.026970629536515783, "3": 0.004518202686256633, "1": 0.0013860753702544248, "2": 1.9365914920990276e-05}, "score": 4.958390413834421}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9633971664386155, "4": 0.03392752320671475, "3": 0.002293656522787488, "1": 0.00037389557902550984, "2": 6.738804652700681e-06}, "score": 4.959969324208449}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.899622471296373, "4": 0.08995773770456268, "3": 0.009782805256715802, "1": 0.0006206292967040501, "2": 1.5361948236104343e-05}, "score": 4.887947937314996}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8760604881763443, "4": 0.09400760459852989, "3": 0.028198485729931274, "1": 0.0016450600349835738, "2": 8.769554132134797e-05}, "score": 4.842751992463289}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8640353039151195, "4": 0.09802365028382905, "3": 0.03429598455605035, "1": 0.0030135695675745627, "2": 0.00038576491597600135}, "score": 4.820128608371302}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9694562787651689, "4": 0.02726145988606692, "3": 0.0026104660770696416, "1": 0.000624231228338386, "2": 2.295182738520326e-05}, "score": 4.964950964929863}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9408010328463453, "4": 0.049938901038969516, "3": 0.007652376697368247, "1": 0.0015474179125722948, "2": 4.966296865846118e-05}, "score": 4.928416925618402}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9871496647756632, "4": 0.011767932871789018, "3": 0.000647064679593547, "1": 0.0004310651151661673, "2": 3.268681059956082e-06}, "score": 4.985203856411676}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.970880144915525, "4": 0.02546012694013069, "3": 0.0025225936009569024, "1": 0.0011008368672736956, "2": 2.2039175139333337e-05}, "score": 4.965024722168411}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9685731207669642, "4": 0.028444575625939297, "3": 0.0028149071554853466, "1": 0.00015689009964391597, "2": 8.547369356161607e-06}, "score": 4.965272339525562}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9038918687128618, "4": 0.08477291379518846, "3": 0.011069149106839357, "1": 0.0002490838428259261, "2": 1.3166958637120386e-05}, "score": 4.892052539645459}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9563232906130719, "4": 0.03742700785557487, "3": 0.006012194233371092, "1": 0.0002228833539084925, "2": 1.1079777035471511e-05}, "score": 4.949623652388752}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984099923037494, "4": 0.001532372026504461, "3": 3.188920521359446e-05, "1": 2.5275828858124694e-05, "2": 0}, "score": 4.9983027454488465}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9362947670688414, "4": 0.060886914255902445, "3": 0.002411491121971171, "1": 0.00039630259885193404, "2": 5.315242083408419e-06}, "score": 4.932688596705448}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9885244151359555, "4": 0.011021614275559031, "3": 0.00039311278599631663, "1": 5.74857193579124e-05, "2": 0}, "score": 4.987962176682475}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9926302107656215, "4": 0.007171574879671905, "3": 0.0001707855298579429, "1": 2.393616650351708e-05, "2": 0}, "score": 4.992391082819251}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9690488621764434, "4": 0.028935062035443045, "3": 0.0016260866158415977, "1": 0.00038322012307599767, "2": 3.868800682943605e-06}, "score": 4.966268180007859}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9878883289508765, "4": 0.011607080257989197, "3": 0.0004145574467952029, "1": 8.817580079506863e-05, "2": 1.0079258021525664e-06}, "score": 4.987208066999581}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9940102927498994, "4": 0.005853707838321494, "3": 8.485547862606605e-05, "1": 4.91192766703649e-05, "2": 0}, "score": 4.993780091504567}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7128282864792831, "4": 0.24622096857294923, "3": 0.03654400968228263, "1": 0.004210474204426462, "2": 0.00014811952630097927}, "score": 4.663388551674138}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.910459178478706, "4": 0.08342879211488995, "3": 0.003084095060463801, "1": 0.002966069806421585, "2": 4.666836648536734e-05}, "score": 4.89839718946515}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9076645236468547, "4": 0.08473318156716318, "3": 0.006304205680348315, "1": 0.0012414391096626854, "2": 3.3913479406437974e-05}, "score": 4.897588581716361}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9843434965352587, "4": 0.01526112551420469, "3": 0.00025466846397431523, "1": 0.00013381785148490472, "2": 0}, "score": 4.983694153777966}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9701199212224944, "4": 0.029032366068867846, "3": 0.0005908865628578956, "1": 0.0002475878721443201, "2": 0}, "score": 4.968795221038553}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9427918683097961, "4": 0.05128812167052212, "3": 0.005798956450182872, "1": 0.00011021605303837407, "2": 7.921206720853396e-06}, "score": 4.936649152846103}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9879753568547934, "4": 0.011128409789034217, "3": 0.0008210988941839348, "1": 7.272713477065576e-05, "2": 1.4252590090832079e-06}, "score": 4.986934195274977}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9656376969862014, "4": 0.030785428549237617, "3": 0.0034778409305257618, "1": 9.154801218212662e-05, "2": 4.920423273309787e-06}, "score": 4.961877838484061}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9878693705678714, "4": 0.011803274334831127, "3": 0.0002852376116396208, "1": 3.837459138735947e-05, "2": 0}, "score": 4.987472705188001}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9830793340879759, "4": 0.015983073867133504, "3": 0.0007245346291770273, "1": 0.00020529573677202138, "2": 4.2532804592662605e-06}, "score": 4.981733850001114}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9721765570123231, "4": 0.02489873450239514, "3": 0.0025337851185202195, "1": 0.00036900033723801667, "2": 1.550723296468656e-05}, "score": 4.968510970185509}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9831511073977495, "4": 0.015841132483199984, "3": 0.000837373458507795, "1": 0.0001626590932097311, "2": 0}, "score": 4.981833343842887}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9007645601594839, "4": 0.0907770117489515, "3": 0.008165747560870051, "1": 0.00026248463788183774, "2": 2.1012522257072513e-05}, "score": 4.891777523163903}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9775005602275179, "4": 0.02119976462415507, "3": 0.001071968393975474, "1": 0.00022199559913604409, "2": 2.917393433798573e-06}, "score": 4.975759496288855}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9589278821704572, "4": 0.03875429076087174, "3": 0.0020569746338727837, "1": 0.0002511035886968089, "2": 6.9844521547939414e-06}, "score": 4.956106270920571}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9603485639237197, "4": 0.03809312725991587, "3": 0.001367635831861726, "1": 0.00018067603360763458, "2": 0}, "score": 4.95844848155344}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9194605588361932, "4": 0.07379266814055317, "3": 0.006556033554353099, "1": 0.00016977390104394092, "2": 1.2054385769170685e-05}, "score": 4.912379225184578}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9543869040024328, "4": 0.03939999064952412, "3": 0.00566691160565971, "1": 0.0005300386656619368, "2": 1.4095189345019374e-05}, "score": 4.947103636947922}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9880253980859012, "4": 0.011703375201731021, "3": 0.00022288357679195768, "1": 4.640798606834416e-05, "2": 0}, "score": 4.987665201830732}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9912184708542315, "4": 0.008079009504824396, "3": 0.0005143007226863323, "1": 0.00018506822816211129, "2": 2.016395593642389e-06}, "score": 4.990146055773099}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9673001197455913, "4": 0.029812646389679183, "3": 0.0018589508677307012, "1": 0.001012678579217436, "2": 1.0813523837669742e-05}, "score": 4.962386116782351}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9850948401784214, "4": 0.013987272080357445, "3": 0.0004976413107446718, "1": 0.00040919640883023807, "2": 5.198234548121956e-06}, "score": 4.983364967614519}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918493650257874, "4": 0.0074465041375621375, "1": 0.00036012801229961747, "3": 0.00033676227229401855, "2": 0}, "score": 4.990439390044558}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.960073226332061, "4": 0.034645151187742126, "3": 0.003653582813847579, "1": 0.001527986077290801, "2": 4.260201522741374e-05}, "score": 4.951805163960535}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9880444780285894, "4": 0.011450948660139845, "3": 0.0003200136201844106, "1": 0.00017799795437740417, "2": 0}, "score": 4.987196948271728}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6982558472795042, "4": 0.27215364522925195, "3": 0.028343240714629313, "1": 0.0011795562152675384, "2": 6.035444255239838e-05}, "score": 4.666258130107921}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9818645784068121, "4": 0.01690651886113914, "3": 0.0007068620721477116, "1": 0.0005145180091992757, "2": 0}, "score": 4.979621531657668}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9877913072753787, "4": 0.011647519967015635, "3": 0.00039488735932366, "1": 0.00016291157321092633, "2": 0}, "score": 4.986911014861547}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975220669571552, "4": 0.0023930004069438056, "3": 4.183409002404298e-05, "1": 4.18202452316846e-05, "2": 0}, "score": 4.997356047052315}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9965360194715991, "4": 0.0033490706149790234, "3": 5.952739090484066e-05, "1": 5.2862465912456114e-05, "2": 0}, "score": 4.9963204154668}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8404864479994344, "4": 0.130260719801018, "3": 0.027976511384162277, "1": 0.0012070782606352184, "2": 5.938249927536506e-05}, "score": 4.808777911429889}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9656952796788836, "4": 0.03066279035677649, "3": 0.002923374439390395, "1": 0.0006850041920087304, "2": 1.2688024019317515e-05}, "score": 4.960711560237494}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9889750857812876, "4": 0.00865083267210677, "1": 0.001359969916091221, "3": 0.0010088334657938065, "2": 3.1642958733313103e-06}, "score": 4.983882093773182}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9825488513489834, "4": 0.015521461497613362, "3": 0.001306856687910083, "1": 0.0006011640493663086, "2": 0}, "score": 4.979459723894933}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9630224575990597, "4": 0.030325670922331873, "3": 0.0047696612184018805, "1": 0.0018306265384254504, "2": 2.6846985907891073e-05}, "score": 4.952730790243483}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9693580293501892, "4": 0.028094521108454524, "3": 0.0023570345421544403, "1": 0.00017722330683999347, "2": 8.052169497887519e-06}, "score": 4.9664581876824725}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9972809740653895, "4": 0.0026150867709712174, "3": 8.169685919360531e-05, "1": 2.0320445729249695e-05, "2": 0}, "score": 4.997140232231654}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9530641536667603, "4": 0.04268466315349965, "3": 0.004075287429215344, "1": 0.0001495366566807496, "2": 1.8112903013358796e-05}, "score": 4.948511852071214}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9764780628471801, "4": 0.021727735519829625, "3": 0.0013668893065174946, "1": 0.0004139578917751028, "2": 8.138790306407377e-06}, "score": 4.9738581015822705}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9810453913479628, "4": 0.017858219509869138, "3": 0.0008911040129403003, "1": 0.00019506572595728503, "2": 5.506843315324429e-06}, "score": 4.979562692718439}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9612841011046124, "4": 0.03309449250567646, "3": 0.005059078130141663, "1": 0.0005341593795279354, "2": 1.759770609369676e-05}, "score": 4.954597440639296}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9054657018115081, "4": 0.08936830409422547, "3": 0.00505682734121143, "1": 0.0001002871486819196, "2": 7.121779029908097e-06}, "score": 4.900095351676612}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9174149416494862, "4": 0.07439928108691934, "3": 0.007853601991562965, "1": 0.0002947287842302476, "2": 3.176584188675841e-05}, "score": 4.908618783163037}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9462629961048359, "4": 0.05019106280032717, "3": 0.0030639081644223145, "1": 0.00047308664709572645, "2": 6.64804986292017e-06}, "score": 4.9417686963037255}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9351423455977143, "4": 0.05912249505511854, "3": 0.00533889487326377, "1": 0.00038181223561566314, "2": 8.919488108129946e-06}, "score": 4.928645313003909}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7553681746892613, "4": 0.16418917661518953, "3": 0.05590625549408326, "1": 0.02343227109707773, "2": 0.0010982887415710862}, "score": 4.6269721857770385}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9791889578432748, "4": 0.019350368804962405, "3": 0.001197688655452278, "1": 0.00024979474433143363, "2": 5.393133433149002e-06}, "score": 4.9772387180409225}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9885875556895564, "4": 0.01097187608190897, "3": 0.0003710530179653076, "1": 6.752882595911986e-05, "2": 9.299025883451581e-07}, "score": 4.988013100206614}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9851957318625104, "4": 0.014258771753481657, "3": 0.0004448103261642712, "1": 9.625881544032568e-05, "2": 0}, "score": 4.984466503561875}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9978816084652096, "4": 0.0020785598601479435, "3": 2.4553454519444095e-05, "1": 1.471389901013369e-05, "2": 0}, "score": 4.9978134764008715}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9815525393988662, "4": 0.01676543420342975, "3": 0.0014898244272919395, "1": 0.00018198095849768608, "2": 4.9697948319779265e-06}, "score": 4.979511976136439}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9388909506602979, "4": 0.054451379214359885, "3": 0.006156708368614611, "1": 0.00048153314120910173, "2": 1.3811037039335272e-05}, "score": 4.931267252260852}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9568405364424976, "4": 0.0355028536934692, "3": 0.006663969173190954, "1": 0.0009526499838498968, "2": 3.532548146161284e-05}, "score": 4.947252385500847}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9018400840928513, "4": 0.08559905804861083, "3": 0.009916427039843087, "1": 0.0025867733260695283, "2": 4.209885562287071e-05}, "score": 4.884092894643978}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9556173667835366, "4": 0.038065790017733164, "3": 0.005582134772698175, "1": 0.0007129280886997703, "2": 1.928978262311441e-05}, "score": 4.94786022887725}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9945684380648034, "4": 0.005181394761383958, "1": 0.000165774355254095, "3": 8.298854265477761e-05, "2": 0}, "score": 4.993989522291922}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9928644716379568, "4": 0.006819991864609397, "3": 0.00017272203322996117, "1": 0.00013970744504905773, "2": 0}, "score": 4.992275710289219}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9827285219191405, "4": 0.015743501531946858, "3": 0.0010081496077089397, "1": 0.0005119525566557324, "2": 0}, "score": 4.980192233052039}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991495179650336, "4": 0.000755766191591728, "1": 7.590203973081543e-05, "3": 1.7909289737363436e-05, "2": 0}, "score": 4.998904806079392}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9966686279745594, "4": 0.003187035833385538, "1": 9.519567955713402e-05, "3": 4.6331985678511116e-05, "2": 0}, "score": 4.996339507196437}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9959506000210685, "4": 0.0034654007377405184, "3": 0.0004708401056659218, "1": 0.00011247067915758285, "2": 0}, "score": 4.995143032990488}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9905392472040556, "4": 0.00788592542660417, "1": 0.0007982098700831066, "3": 0.0007730348703347906, "2": 3.0832602441161117e-06}, "score": 4.987365909262592}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9971124021538922, "4": 0.00196980977856191, "1": 0.0006037204489704589, "3": 0.0003117518622142991, "2": 1.717266114496176e-06}, "score": 4.9949866499023425}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988211829513322, "4": 0.0011195298036422708, "1": 3.980336904040587e-05, "3": 1.9248257900520346e-05, "2": 0}, "score": 4.998682759894029}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9957636826154774, "4": 0.0039406078142270335, "1": 0.00024137905928954745, "3": 5.3673347597589756e-05, "2": 0}, "score": 4.994986525958748}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6144072174905381, "4": 0.29947755673822013, "3": 0.07111846295527337, "1": 0.014093959184924655, "2": 0.0008984711152532832}, "score": 4.49921209759428}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9781189065483015, "4": 0.021071990180054387, "3": 0.00040354966190348716, "1": 0.0003977334104903422, "2": 0}, "score": 4.976529793312486}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9651670575441914, "4": 0.03343628805723665, "1": 0.0006977843200600255, "3": 0.000688078931908729, "2": 5.342376321237587e-06}, "score": 4.962380184688011}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9804387121800238, "4": 0.0189501922952233, "3": 0.00037971734916520376, "1": 0.00022815416391030213, "2": 0}, "score": 4.979377689864236}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.985925314688879, "4": 0.013354221859142357, "3": 0.0004135924869291331, "1": 0.000300722694074843, "2": 2.999199914596909e-06}, "score": 4.984606656316223}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9815480733449722, "2": 0.009879480989789562, "3": 0.007446124375535135, "4": 0.0007558101784640848, "5": 0.00036873770250696254}, "score": 1.028514161653543}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8586139722760602, "4": 0.12791913148453596, "3": 0.011965778439766286, "1": 0.0014460493893285332, "2": 4.0982516870277435e-05}, "score": 4.842239944336674}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9925160498679066, "4": 0.006913637283670004, "3": 0.0004289617516517093, "1": 0.00013767083165175883, "2": 2.2222596930859185e-06}, "score": 4.991671076963725}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9913383035244777, "4": 0.008213851849096055, "3": 0.00026910928417242573, "1": 0.00017056535856544222, "2": 0}, "score": 4.99056559106933}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.873709227786876, "4": 0.11568427105057655, "3": 0.009510840744221576, "1": 0.001055354024603523, "2": 3.147688786523053e-05}, "score": 4.860976973194341}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9856018984673887, "4": 0.009939813709383427, "1": 0.0026220416734569004, "3": 0.0018218664161202775, "2": 1.1913611356859227e-05}, "score": 4.9758924864784}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9890770059042475, "4": 0.00980643672731977, "1": 0.0006761247212828626, "3": 0.0004314680043569957, "2": 4.432095769992216e-06}, "score": 4.986612771413282}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9923408687785501, "4": 0.007080850155676299, "3": 0.0003288723093543372, "1": 0.00024470405899874317, "2": 0}, "score": 4.991282547976646}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977134309907943, "4": 0.0018895686565599697, "1": 0.00031719304331046287, "3": 7.835282763688501e-05, "2": 0}, "score": 4.996684948693242}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951908515637644, "4": 0.003786099293676336, "1": 0.0008196312614511513, "3": 0.00020078959283516048, "2": 0}, "score": 4.992533776851462}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8853234327537648, "4": 0.09584023429218778, "3": 0.017736253744881008, "1": 0.0010070711624167571, "2": 7.874569093825582e-05}, "score": 4.864420802816817}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.978882615590039, "4": 0.019731080423617566, "3": 0.0011285895632398913, "1": 0.00025231733419008804, "2": 4.348406942733017e-06}, "score": 4.976989401761515}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9800743331901199, "4": 0.0180907521901483, "3": 0.0015818049666683324, "1": 0.00024519420204537377, "2": 4.014583307045215e-06}, "score": 4.977752730534757}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9857027681557871, "4": 0.013704181140125345, "3": 0.0004750624447207876, "1": 0.00011531990603661867, "2": 1.3751482699064852e-06}, "score": 4.984880269348563}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9775042063114074, "4": 0.021022667891762846, "3": 0.0012655603379209284, "1": 0.00019740995532349618, "2": 0}, "score": 4.975656324388817}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8915788135803518, "4": 0.0861264598008326, "3": 0.021893871970825533, "1": 0.00035280290490776096, "2": 4.469101872100607e-05}, "score": 4.868540069781132}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8027103740371012, "4": 0.14912878760896467, "3": 0.047537495518533555, "1": 0.0005605893034243982, "2": 5.8147655381095765e-05}, "score": 4.753378285264943}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9506936081014143, "4": 0.04432337893238801, "3": 0.0045168474287495455, "1": 0.0004407817513131002, "2": 1.5434766933416356e-05}, "score": 4.944832946045981}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9432257428815616, "4": 0.05366560422024723, "3": 0.0029116230620601837, "1": 0.00018033271439178665, "2": 8.298016895189958e-06}, "score": 4.939764418822418}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8572908897762899, "4": 0.12931758511702035, "3": 0.012549493158459392, "1": 0.0008003591448285885, "2": 3.4902608131030605e-05}, "score": 4.842276216341539}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9805087317303737, "4": 0.018455030312365624, "3": 0.000982782228500072, "1": 5.150194417686743e-05, "2": 0}, "score": 4.97937335715391}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9893275663905787, "4": 0.00976035994135467, "3": 0.000818675800880724, "1": 9.01550132289798e-05, "2": 0}, "score": 4.9882416302732935}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9910099126778562, "4": 0.008575067622117523, "3": 0.0003396052310780855, "1": 7.129302937855139e-05, "2": 0}, "score": 4.990460510481781}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967893083296515, "4": 0.002939899152766408, "3": 0.00022681315163120377, "1": 4.294269523573875e-05, "2": 4.742282931880477e-07}, "score": 4.996433279072074}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9912782104179586, "4": 0.00808936534750118, "3": 0.0005651762096240909, "1": 6.41620271291127e-05, "2": 0}, "score": 4.990523604880599}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9833198158540187, "4": 0.015674266309031185, "3": 0.0008900967440196111, "1": 0.00011094788182779967, "2": 2.298136455930896e-06}, "score": 4.982094808159045}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9816559239196575, "4": 0.01767202673535851, "3": 0.000609835078784407, "1": 5.914739553732464e-05, "2": 2.368665124744633e-06}, "score": 4.980864594169104}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9870495393147153, "4": 0.012508919864469585, "3": 0.00036696392930958603, "1": 7.023561776739999e-05, "2": 0}, "score": 4.986476151095112}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993784203107439, "4": 0.0006163327263964603, "1": 1.2876612107679085e-06, "3": 1.1359832301115783e-06, "2": 0}, "score": 4.999376242901235}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982655159590706, "4": 0.001703024484720613, "3": 2.240684646599712e-05, "1": 7.385041666146719e-06, "2": 0}, "score": 4.9982226186915995}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9922423993137013, "4": 0.006600147379313879, "3": 0.000959453889952576, "1": 0.0001881406945051288, "2": 5.510142902598045e-06}, "score": 4.990711811243624}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9940630596957892, "4": 0.005727841619116363, "3": 0.0001530960585372635, "1": 5.1373427186047947e-05, "2": 0}, "score": 4.993760443670914}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9966962155459825, "4": 0.003169254158519657, "3": 9.668589786572033e-05, "1": 3.459598233943874e-05, "2": 0}, "score": 4.996498978743621}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9955158754426187, "4": 0.004316081277891545, "3": 0.00012053685514150119, "1": 4.450255298447766e-05, "2": 0}, "score": 4.995264820576018}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9866093305003737, "4": 0.01306736994474872, "3": 0.0002571960303031632, "1": 6.127228119972619e-05, "2": 0}, "score": 4.986173082068641}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.909199706331856, "4": 0.07046105028945276, "3": 0.020009976596047453, "1": 0.0003055989306072063, "2": 2.135507802428343e-05}, "score": 4.888232277068467}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9805910341847515, "4": 0.01839743180360226, "3": 0.0009976057497823804, "1": 1.2526852722207278e-05, "2": 8.293330611092318e-07}, "score": 4.979554749590523}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.980962097263095, "4": 0.01813520866699475, "3": 0.0008436433700506084, "1": 5.6519321772431344e-05, "2": 1.4970830147342613e-06}, "score": 4.979946915315963}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974206543432466, "4": 0.0025316940888222023, "3": 3.410474615257289e-05, "1": 1.1795953606555869e-05, "2": 0}, "score": 4.997352907969736}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9432865187605616, "4": 0.05583990621836338, "3": 0.000794246016699023, "1": 7.422511410725286e-05, "2": 0}, "score": 4.942274406666716}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9624962662966822, "4": 0.0342795881369319, "3": 0.00299576845807585, "1": 0.00021002037671036117, "2": 1.2545098831729472e-05}, "score": 4.958850919000232}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9822340842838647, "4": 0.016743469120446934, "3": 0.0009437134373805011, "1": 7.004196468784061e-05, "2": 0}, "score": 4.981088771784895}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9895463868084022, "4": 0.00963537555182972, "3": 0.0005548992456874415, "1": 0.0002600129813307307, "2": 1.836270399856162e-06}, "score": 4.988209247662165}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9851890148209089, "4": 0.014207773991338435, "3": 0.000497878941424351, "1": 9.5492485446272e-05, "2": 0}, "score": 4.9844143448249065}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9944086829255449, "4": 0.0053711120835133715, "3": 0.00016189169430279703, "1": 5.701181676210103e-05, "2": 0}, "score": 4.9940770495522315}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9912604042473915, "4": 0.008037819813812947, "3": 0.0005721393370545566, "1": 0.00012753598473122602, "2": 0}, "score": 4.990307737213421}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9976372556848765, "4": 0.002310150280664044, "3": 2.8053420232679083e-05, "1": 2.3881248226845936e-05, "2": 0}, "score": 4.997538216262748}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962214520460804, "4": 0.003610597528406919, "3": 0.000113602391495705, "1": 5.279363097507293e-05, "2": 0}, "score": 4.99595101687095}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988474669769418, "4": 0.001063243645856799, "1": 6.624828368997088e-05, "3": 2.0324388278136057e-05, "2": 0}, "score": 4.9986311107239585}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9958833161701802, "4": 0.003961799253342182, "1": 0.00010911578410684201, "3": 4.348728332347152e-05, "2": 0}, "score": 4.995514752810451}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8703955721824138, "4": 0.11382858528914297, "3": 0.01506793052390766, "1": 0.0006814416026052335, "2": 2.6070686432628647e-05}, "score": 4.8532315165276865}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7164638403854815, "4": 0.18827865614673042, "3": 0.08466190858718659, "1": 0.009993230152457452, "2": 0.0005954578217338702}, "score": 4.6006354742304625}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9182637318724522, "4": 0.06743589743184948, "3": 0.013797539497478431, "1": 0.0004732003907971334, "2": 2.627199539436789e-05}, "score": 4.902997080209249}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9065185497064139, "4": 0.08718963672731982, "3": 0.005717925009390722, "1": 0.0005529798470796168, "2": 1.8048066464564766e-05}, "score": 4.89910816105062}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9565245757676124, "4": 0.03891527624186258, "3": 0.003988021642466314, "1": 0.0005636455282856582, "2": 7.699362690481395e-06}, "score": 4.950830961848497}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9316857921731797, "4": 0.061373029456374316, "3": 0.00607919860548456, "1": 0.0006900986497086803, "2": 0}, "score": 4.923695063356212}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9617924240645186, "4": 0.03376632077606332, "3": 0.0038915061935794696, "1": 0.00043641933469623726, "2": 0}, "score": 4.9567000823342955}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9808265347261574, "4": 0.017528900553737826, "3": 0.0013590280552316265, "1": 0.0002643527955907944, "2": 1.1303625986015075e-05}, "score": 4.978661510446011}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.977245010476279, "4": 0.021843381707607593, "3": 0.0005256361051212905, "1": 0.0003727957781208841, "2": 6.408694332868345e-06}, "score": 4.975594771730666}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9743300182078063, "4": 0.023308606708174296, "3": 0.00208252745570121, "1": 0.0002591796778283169, "2": 1.1373107279307814e-05}, "score": 4.97145526357316}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9567905476145157, "4": 0.042079832124391744, "3": 0.000990646299556683, "1": 0.00013406604584476387, "2": 0}, "score": 4.955402392211817}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9176139459439934, "4": 0.0791815707333223, "3": 0.003025718484997705, "1": 0.00016763291482960597, "2": 0}, "score": 4.914095504355145}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9155795648634988, "4": 0.07926488979691239, "3": 0.004793297936410242, "1": 0.00034063313849596623, "2": 1.5331117062381784e-05}, "score": 4.909739421304557}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9913620879983733, "4": 0.008342828261631548, "3": 0.00023424148208598506, "1": 5.6676494061711225e-05, "2": 0}, "score": 4.990961945147547}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9811898658240992, "4": 0.018559947134218265, "3": 0.0002066962983000095, "1": 4.152154951822089e-05, "2": 0}, "score": 4.980860536381794}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"5": 0.40667005418277297, "4": 0.3163599599269725, "3": 0.27360661934882313, "1": 0.00239715298988327, "2": 0.000964549890649335}, "score": 4.123943082282261}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9240121851829234, "4": 0.0700072969655945, "3": 0.0056625101255385795, "1": 0.0002965069202503627, "2": 1.6463479397989203e-05}, "score": 4.917431848741414}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9357447712285116, "4": 0.05870566788471149, "3": 0.005320877742745156, "1": 0.00021703650342990097, "2": 9.961110466122735e-06}, "score": 4.929754428883653}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9746430349712938, "4": 0.023407935270049356, "3": 0.0018680690036542698, "1": 7.654398615136696e-05, "2": 3.522569017630058e-06}, "score": 4.972539158515505}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8996363525781989, "4": 0.0920676818614805, "3": 0.005284387290822304, "1": 0.0029921981334187714, "2": 1.7928086439444512e-05}, "score": 4.885340800273032}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9715715732013224, "4": 0.024599577770301542, "3": 0.0033830080826176565, "1": 0.00041863325823399605, "2": 1.7280514858156906e-05}, "score": 4.966907702974007}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9852590277955058, "4": 0.013160970626391063, "3": 0.0011152674916689862, "1": 0.0004416503730942116, "2": 0}, "score": 4.982841496815925}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9806778134667624, "4": 0.01588524639828651, "3": 0.003163124417972185, "1": 0.00025555344298445207, "2": 9.052505389014728e-06}, "score": 4.976738919248493}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9935451314483347, "4": 0.0062428691662114455, "3": 0.000170012941047918, "1": 4.064783430579147e-05, "2": 0}, "score": 4.993254504584881}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9849152274660167, "4": 0.014241699972959316, "3": 0.0005915105728883524, "1": 0.00023986794865092653, "2": 0}, "score": 4.983615615487021}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8757062984545819, "4": 0.10407439489941582, "3": 0.01930240267281898, "1": 0.0007891840455487102, "2": 9.089959611227576e-05}, "score": 4.853885984817936}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9517408506042909, "4": 0.028644913237909513, "3": 0.0007062664385157404, "1": 0.00013136498024889976, "2": 0}, "score": 4.968831862159377}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9658271418171106, "4": 0.032030573834155286, "3": 0.0020123487636343846, "1": 0.00011848922853019174, "2": 6.946212576152838e-06}, "score": 4.963449768605421}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9064999354456275, "4": 0.08380855402775933, "3": 0.009158391647929465, "1": 0.00047537742048058435, "2": 3.5357995858886945e-05}, "score": 4.895864748099394}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9063961063571868, "4": 0.08882068650292987, "3": 0.004548305195110473, "1": 0.00021832473357040957, "2": 1.095772358627123e-05}, "score": 4.901175975661427}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9349744278130809, "4": 0.05660291462259359, "3": 0.007957773733222893, "1": 0.0004053732541901614, "2": 3.403320133400469e-05}, "score": 4.925756053749294}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9052192721147907, "4": 0.08886334843889958, "3": 0.005674114857649245, "1": 0.0002221568264594537, "2": 1.3923506932252305e-05}, "score": 4.898857297384174}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9448988748076618, "4": 0.052033064848731034, "3": 0.0026589438072055858, "1": 0.0003927373068505278, "2": 6.858656368915717e-06}, "score": 4.941056961168834}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9897225724239774, "4": 0.00988944057162958, "3": 0.0003426407622573767, "1": 4.032632808352419e-05, "2": 0}, "score": 4.989263918697317}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9404719624586356, "4": 0.05311034227103809, "3": 0.006198701155040013, "1": 0.0001921844442360165, "2": 1.5554462235842193e-05}, "score": 4.933676107765973}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9152920722470443, "4": 0.08016121376349906, "3": 0.004095294284141491, "1": 0.0004330988781614464, "2": 1.42511920801658e-05}, "score": 4.909872681794036}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9928138345576297, "4": 0.006964238570364954, "3": 0.0001482815094508917, "1": 7.261079178529852e-05, "2": 5.439883531338942e-07}, "score": 4.992447119573221}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9874007604536844, "4": 0.01187250566960684, "3": 0.0005486372947998047, "1": 0.000171632670757909, "2": 3.1982588679576384e-06}, "score": 4.986334049652916}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984747581654368, "4": 0.0013513029551885435, "1": 0.00014286806156544967, "3": 2.951070438287458e-05, "2": 0}, "score": 4.998018200297951}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9911061612611569, "4": 0.006014660339866771, "1": 6.0879199093000384e-05, "3": 3.4539671361951346e-05, "2": 0}, "score": 4.993655080791734}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9805771638226712, "4": 0.01659692237341603, "3": 0.001869252800296081, "1": 0.0009346616180576486, "2": 1.3336165534337811e-05}, "score": 4.975885708149742}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9951812861338265, "4": 0.0042753705584959835, "1": 0.0003131632305515987, "3": 0.00022830045761149074, "2": 9.74478871118886e-07}, "score": 4.994012446747884}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9910391845699468, "4": 0.008382819208524897, "1": 0.0003019805338853941, "3": 0.0002734791973151387, "2": 1.874928561127034e-06}, "score": 4.989856668765181}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9843746839843127, "4": 0.014509113641441621, "3": 0.0005762050333098218, "1": 0.0005338538209596132, "2": 3.7709635711396097e-06}, "score": 4.982191705866204}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.998493653680246, "4": 0.001384049993455657, "1": 8.533840246759801e-05, "3": 3.549843311722329e-05, "2": 0}, "score": 4.998203596908606}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9873298765101358, "4": 0.012221266366029373, "3": 0.00028597905045062106, "1": 0.00015931439197907306, "2": 0}, "score": 4.986569470103024}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9992622336834982, "4": 0.000728435626995975, "3": 1.8042834962014046e-06, "1": 1.6157472739144033e-06, "2": 0}, "score": 4.999261488451827}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9701763460080776, "4": 0.02909947343458065, "3": 0.0006061470163986477, "1": 0.00011238658254562691, "2": 0}, "score": 4.969238512493599}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979644675118907, "4": 0.001993994032849254, "1": 1.936719311355496e-05, "3": 1.663131822519317e-05, "2": 0}, "score": 4.99789526289812}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951129380369894, "4": 0.00475062685580337, "3": 7.492791799307882e-05, "1": 5.64422819706229e-05, "2": 0}, "score": 4.994873722216205}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8797500376360952, "4": 0.09709340749160573, "3": 0.02264690456928822, "1": 0.000489526480705164, "2": 1.771666209301101e-05}, "score": 4.855601179869623}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9395182942429491, "4": 0.05589449964472374, "3": 0.003680233786054537, "1": 0.0008987051974666909, "2": 7.014143130871836e-06}, "score": 4.93312908577561}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9058248173215785, "4": 0.07954328023381085, "3": 0.008810800328239941, "1": 0.005740396467746389, "2": 7.438167129775797e-05}, "score": 4.879649627131802}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9891145539582408, "4": 0.01020715534723899, "1": 0.00044940916705043794, "3": 0.0002222045953121103, "2": 0}, "score": 4.987550715670909}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9844692918593891, "4": 0.013613090669032312, "1": 0.0012541653342096706, "3": 0.0006581940903482336, "2": 2.5985654895160794e-06}, "score": 4.9800460110497}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9902119657033741, "4": 0.009491448914356677, "3": 0.0002628111091465811, "1": 2.9098061532764064e-05, "2": 0}, "score": 4.989866489234778}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9421643711132627, "4": 0.054534922647688874, "3": 0.0032181391184726927, "1": 7.255011452999268e-05, "2": 6.485815476438207e-06}, "score": 4.938718924815662}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9712166801894464, "4": 0.0277619805618656, "3": 0.0009362905621617596, "1": 7.591122443328616e-05, "2": 0}, "score": 4.970061519854351}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9950390378232113, "4": 0.004881964883955796, "3": 6.209916594204372e-05, "1": 1.5486234893425434e-05, "2": 0}, "score": 4.994931884688956}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9983508201940111, "4": 0.0015888353745068438, "1": 3.959336516815476e-05, "3": 1.9996705959503014e-05, "2": 0}, "score": 4.998212796404705}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9887740020989685, "4": 0.01027218317229187, "3": 0.0006259884108842499, "1": 0.0003230960210912376, "2": 3.841133702161527e-06}, "score": 4.987171921114214}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9941339856430561, "4": 0.005304663179883376, "3": 0.00033767704750446107, "1": 0.00022062569061838064, "2": 1.8397607904224105e-06}, "score": 4.993131952379003}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9856824954154298, "4": 0.013101441718281117, "3": 0.0009009966666268648, "1": 0.00030802765193834304, "2": 4.882207909247275e-06}, "score": 4.983849772891607}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979209014258587, "4": 0.001881010775646426, "1": 0.00012308258563154274, "3": 7.395409463666853e-05, "2": 0}, "score": 4.99747874804242}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9983402396282507, "4": 0.001447686665013366, "3": 0.00012743386931014236, "1": 8.391107087315879e-05, "2": 0}, "score": 4.997961799827502}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9394364450956005, "4": 0.05235748876678376, "3": 0.007529143414617333, "1": 0.0006282640613602213, "2": 3.69307507612868e-05}, "score": 4.929959554478154}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9385954249197904, "4": 0.05633833892600774, "3": 0.004391541388357124, "1": 0.0006477450372966719, "2": 1.4759700947598749e-05}, "score": 4.932242493079369}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9648871832757732, "4": 0.032719030430706744, "3": 0.002057115541461232, "1": 0.00032432352708369175, "2": 7.815606421346926e-06}, "score": 4.961845824658603}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9807416743431338, "4": 0.01790912893089274, "3": 0.0012336432447974382, "1": 0.00010280557241918698, "2": 0}, "score": 4.979212097287548}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9634820416139169, "4": 0.03497941966533506, "3": 0.001389023217620637, "1": 0.00014493227407531782, "2": 3.180544975220024e-06}, "score": 4.961653209379765}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9765148972709, "4": 0.021495980818460245, "3": 0.001516622281592013, "1": 0.000460838915550017, "2": 9.569682783676851e-06}, "score": 4.973598654701781}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9936544707472964, "4": 0.005882386688627759, "3": 0.00027475795816123166, "1": 0.00018649166715735722, "2": 1.14689760020135e-06}, "score": 4.992818684676062}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987745699533647, "4": 0.0011703575249163358, "3": 2.7391056581118113e-05, "1": 2.652741052816351e-05, "2": 0}, "score": 4.998668749183473}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986330771912114, "4": 0.0011755243213279714, "1": 0.0001491553765074773, "3": 4.080822107155844e-05, "2": 0}, "score": 4.998146235070551}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9902859670085955, "4": 0.008980434612595714, "3": 0.0005145159511313552, "1": 0.00021372231051263108, "2": 0}, "score": 4.989135586008559}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9512737337992628, "4": 0.04496197259118751, "3": 0.0034968511040603914, "1": 0.00024057371695002097, "2": 1.4786721143068226e-05}, "score": 4.947037030267292}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9860616036345546, "4": 0.012403829790303593, "3": 0.0011584261063821114, "1": 0.00036965083022047696, "2": 0}, "score": 4.9838006095478615}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9882577284469738, "4": 0.011016098236232518, "3": 0.000567248544610994, "1": 0.00015275442369069958, "2": 0}, "score": 4.987238308235698}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9922405213975134, "4": 0.007573048382919024, "3": 0.00013889768152888194, "1": 4.523158192314596e-05, "2": 0}, "score": 4.991968211445538}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9752303270608116, "4": 0.02372069512128913, "3": 0.0007935059655536873, "1": 0.00024379471957277453, "2": 0}, "score": 4.973716807156979}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9905812370527132, "4": 0.008426756818760175, "3": 0.000761487348261628, "1": 0.00022479223103382567, "2": 2.6562664801530955e-06}, "score": 4.98914309742738}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9957290545397673, "4": 0.004090343201911827, "3": 0.00011484478923923977, "1": 6.234195025169297e-05, "2": 0}, "score": 4.995430583811677}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9970905943476045, "4": 0.002724182216347051, "3": 0.00012286344777376858, "1": 6.010443052032812e-05, "2": 0}, "score": 4.99678966592493}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943748527232149, "4": 0.005225012963926926, "3": 0.0002089620294035072, "1": 0.0001836416965812654, "2": 0}, "score": 4.993622448164232}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9943479840833299, "4": 0.005319446619127113, "1": 0.00018706301860369436, "3": 0.00014024635544935068, "2": 0}, "score": 4.993651775204382}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9740149464754514, "4": 0.02450731584713122, "3": 0.0013769210440311667, "1": 9.621098669547934e-05, "2": 3.4466355694365243e-06}, "score": 4.97234362615727}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9917951867339809, "4": 0.0077916782955469175, "3": 0.00022593934040652394, "1": 0.00018511468611760924, "2": 0}, "score": 4.991015965583897}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9505808140458155, "4": 0.038106580318149015, "3": 0.010026680388857297, "1": 0.0011816836918481543, "2": 6.435898542666531e-05}, "score": 4.936917731297473}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967222698245976, "4": 0.0031118387175160236, "1": 0.00010029677671033113, "3": 6.350912256138909e-05, "2": 0}, "score": 4.99635994833898}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.971196784048333, "4": 0.026484823716046543, "3": 0.002133179477088856, "1": 0.00017693873769844727, "2": 6.904252719905719e-06}, "score": 4.968520306500942}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9966046828697964, "4": 0.0033358738831880536, "3": 4.484780103416588e-05, "1": 1.2904196363486229e-05, "2": 0}, "score": 4.996522807848488}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.996461677269449, "4": 0.0034172802254758793, "1": 6.212767600176936e-05, "3": 5.5307833768621355e-05, "2": 0}, "score": 4.996223579781449}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9977525912132886, "4": 0.0021227484314683413, "3": 6.483927775753893e-05, "1": 5.8872939742379326e-05, "2": 0}, "score": 4.997512078895155}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971113323525698, "4": 0.002816413533733783, "3": 3.61768914754832e-05, "1": 3.519420920905681e-05, "2": 0}, "score": 4.9969704531713495}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986221438166807, "4": 0.001233199829759562, "1": 0.00011827714510772863, "3": 2.5244127589614585e-05, "2": 0}, "score": 4.998243201340522}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9815781523650002, "4": 0.01769592308701974, "3": 0.0006232613030906421, "1": 9.843688269489219e-05, "2": 0}, "score": 4.980663725053918}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9736528321908786, "4": 0.0255075013369709, "3": 0.0006726216975234058, "1": 0.0001591430618854242, "2": 0}, "score": 4.972510465806038}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9615860388244181, "4": 0.0360167741656767, "3": 0.0020977555322231633, "1": 0.0002932523666633495, "2": 3.559743735861136e-06}, "score": 4.958603917640472}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9932673719826052, "4": 0.006565904530415438, "3": 0.0001189699045237389, "1": 4.5425678821828676e-05, "2": 0}, "score": 4.993014436683532}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.995674092808616, "4": 0.004137074845224373, "3": 0.00012617572244705378, "1": 6.101495865505847e-05, "2": 0}, "score": 4.995366506268616}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9711493305904156, "4": 0.026410133441433586, "3": 0.0018858794785888778, "1": 0.0005331682593673377, "2": 1.1730151262831262e-05}, "score": 4.967649928435578}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9811525636568617, "4": 0.017800993653710386, "3": 0.0006361771472470937, "1": 0.00040320316158710425, "2": 0}, "score": 4.979313693310877}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9842034078478651, "4": 0.01488483008146666, "3": 0.0004845186180616207, "1": 0.0004183017901254238, "2": 0}, "score": 4.982472768799323}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9900203069432323, "4": 0.009336031593057686, "1": 0.0003883455585047469, "3": 0.000246236032581983, "2": 0}, "score": 4.988618010760747}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9964670041685216, "4": 0.0033224613508344597, "1": 0.00012472690134947924, "3": 8.215535746215134e-05, "2": 0}, "score": 4.996014305772205}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8105326539248654, "4": 0.1553252614172243, "3": 0.03329058016304167, "1": 0.0007710652944377993, "2": 6.63306815062313e-05}, "score": 4.774807147896809}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.752864119241718, "4": 0.23194393407290703, "3": 0.015045873671968777, "1": 0.00013073554704263145, "2": 1.2693392188765476e-05}, "score": 4.73740260189142}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8527260872497899, "4": 0.11889066377800103, "3": 0.026618135760604685, "1": 0.0016522950799657246, "2": 9.053862524713516e-05}, "score": 4.820988280212431}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8510986539857519, "4": 0.13784366476805482, "3": 0.010698005037401384, "1": 0.00033615271242184156, "2": 1.8322220495076924e-05}, "score": 4.839359912112557}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9669833450468194, "4": 0.030256392334093666, "3": 0.002136632473260355, "1": 0.0006157293856284298, "2": 5.702333961515114e-06}, "score": 4.962990236811753}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9559941549676518, "4": 0.038973007026849346, "1": 0.003126394047702136, "3": 0.0018961956301749988, "2": 6.273507185336368e-06}, "score": 4.9447099852325564}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9926976403414642, "4": 0.007008675080552273, "3": 0.0002624780758479163, "1": 2.876092105695307e-05, "2": 0}, "score": 4.9923513063780245}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9853814774844247, "4": 0.011939512511903005, "3": 0.002036969733944075, "1": 0.0006350143251720358, "2": 5.513924157451355e-06}, "score": 4.98142992086871}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9950720928725503, "4": 0.004511674086487499, "1": 0.0002932684959870682, "3": 0.00012039590949026996, "2": 0}, "score": 4.994074444889993}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.995567390441283, "4": 0.00399606880450288, "1": 0.00026633810097334614, "3": 0.00016821544322247027, "2": 0}, "score": 4.994602137178473}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9613253055081039, "4": 0.03641824112701603, "3": 0.0016942135976475592, "1": 0.0005470509037500354, "2": 1.342443505525567e-05}, "score": 4.9579647805893865}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9976929000555143, "4": 0.0022634863988691416, "3": 2.7870800339521946e-05, "1": 1.4283421912965094e-05, "2": 0}, "score": 4.997623634844915}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9822745669136342, "4": 0.01646723878552019, "3": 0.0007150178861419528, "1": 0.0005351044481159057, "2": 0}, "score": 4.979962145904844}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979725424742519, "4": 0.0019165056980383027, "3": 5.820286369825555e-05, "1": 5.1792407127137926e-05, "2": 0}, "score": 4.99775991680329}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9879231205207338, "4": 0.011723029951042402, "1": 0.00021713375756673772, "3": 0.00013005111402212465, "2": 0}, "score": 4.987148247138127}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9784092494549366, "4": 0.017737461624888883, "3": 0.0035142037800178177, "1": 0.00032309375942700576, "2": 1.152095507865277e-05}, "score": 4.973907076265657}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9873592707454351, "4": 0.01185062464656467, "3": 0.0005833631889309748, "1": 0.00020247482502709714, "2": 0}, "score": 4.9861726906799495}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9874291249353263, "4": 0.01149926682492127, "3": 0.0005619367268977548, "1": 0.0005020263247030224, "2": 0}, "score": 4.98536864256299}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9935356003162508, "4": 0.006048188338286891, "1": 0.00024801136158646993, "3": 0.00016359380520625212, "2": 0}, "score": 4.9926325446691395}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984995938365103, "4": 0.0013964597430868877, "1": 7.424604854104742e-05, "3": 2.8232577959881563e-05, "2": 0}, "score": 4.99825008833832}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.921636933897393, "4": 0.06410808448483528, "3": 0.013748845802901699, "1": 0.000473996320005885, "2": 2.8518458889805763e-05}, "score": 4.9064123443684}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9851305958296301, "4": 0.014329284050131272, "3": 0.0005006904059931447, "1": 3.663835190238923e-05, "2": 0}, "score": 4.9845227385276285}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9840570165108129, "4": 0.014822559028985875, "3": 0.001082378872957159, "1": 3.51647815628824e-05, "2": 0}, "score": 4.982871974756336}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9882132524146167, "4": 0.011504293102685461, "3": 0.00018743002166566849, "1": 8.939972069559793e-05, "2": 0}, "score": 4.987763179142261}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9971007906481558, "4": 0.0028241566215506477, "3": 6.368592356163434e-05, "1": 6.539649416315427e-06, "2": 0}, "score": 4.997022298559828}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7901301106948948, "4": 0.09197345280876318, "1": 0.0872368103587841, "3": 0.029629979774470034, "2": 0.0010146317907890718}, "score": 4.496767895019969}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9935897310012501, "4": 0.00592460832281523, "1": 0.00029147596744937064, "3": 0.00019240154300275266, "2": 0}, "score": 4.992524671391633}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9423941628724068, "4": 0.04887414277308679, "3": 0.007109445691645843, "1": 0.0015865617905252026, "2": 3.06824109740806e-05}, "score": 4.930468323480011}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9976402251565873, "4": 0.002060091870180647, "1": 0.00022812062771317818, "3": 6.853746691244063e-05, "2": 0}, "score": 4.996890341278801}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992041507561338, "4": 0.0007570365674099857, "3": 2.0607550916229565e-05, "1": 1.7252405067545858e-05, "2": 0}, "score": 4.999132737884229}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"5": 0.576568630225663, "4": 0.23945501705529704, "3": 0.18097539430929016, "1": 0.0021917970518884767, "2": 0.0008026757691217593}, "score": 4.387415005836864}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.880083420482413, "4": 0.11172734448016733, "3": 0.007947965460392373, "1": 0.00021440367243923147, "2": 1.796782319517826e-05}, "score": 4.871464062716474}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.968209354286777, "4": 0.02845733587938047, "3": 0.003192281864111515, "1": 0.00013083415881706876, "2": 6.96726364961928e-06}, "score": 4.964613747790764}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8523206186255425, "4": 0.12677487541840238, "3": 0.02056353535732787, "1": 0.0003007605875215334, "2": 3.141619605808372e-05}, "score": 4.830799275008784}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9693973482786199, "4": 0.02935282163060405, "3": 0.000973155571567987, "1": 0.00026783270699371386, "2": 0}, "score": 4.967629250182194}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9808758421153889, "4": 0.017959506396084284, "3": 0.001021179037631153, "1": 0.00013050213123920183, "2": 0}, "score": 4.979475860799051}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9741630138446845, "4": 0.024051257425320657, "3": 0.0016966365291933257, "1": 7.856698381660793e-05, "2": 0}, "score": 4.972240909410575}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9340485942516666, "4": 0.05719673286342255, "3": 0.008586732495861355, "1": 0.00015346500459861886, "2": 1.1422379647565416e-05}, "score": 4.9249814459555115}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952921561015864, "4": 0.00453817105235361, "3": 0.00013846250375527228, "1": 2.7257959166427703e-05, "2": 0}, "score": 4.995075852641352}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9857554770634187, "4": 0.013603162180433255, "3": 0.0005664920563073001, "1": 6.925369894188997e-05, "2": 0}, "score": 4.984986754611798}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"5": 0.883260680979732, "4": 0.0984900648852852, "3": 0.01620106983057322, "1": 0.0018678261704682929, "2": 0.00016560833254140013}, "score": 4.861137617581509}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9785594507163172, "4": 0.019685253044160383, "3": 0.001358997477444385, "1": 0.0003810823745647782, "2": 9.341964462019262e-06}, "score": 4.97604425588313}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9030701256981221, "4": 0.08840668411821456, "3": 0.007337904262098449, "1": 0.001101991810243491, "2": 6.11996553498653e-05}, "score": 4.892323562098247}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9431929823907724, "4": 0.05263452530175279, "3": 0.0030389233119469086, "1": 0.0010970048242754894, "2": 1.7727951201963747e-05}, "score": 4.936845235326602}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9845173538389077, "4": 0.01386583331035379, "3": 0.0010488436577485373, "1": 0.0005590398496286486, "2": 0}, "score": 4.981800157462992}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9882643661022977, "4": 0.011093470355674265, "3": 0.0005678743377926639, "1": 7.269161624142742e-05, "2": 9.000828700749062e-07}, "score": 4.98747730552052}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9948883402251744, "4": 0.004785173478904134, "3": 0.0001635100666168946, "1": 0.00016237209074888652, "2": 0}, "score": 4.994238314544011}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9951488135997028, "4": 0.004453642403350449, "3": 0.00024251645359794563, "1": 0.0001543098444372603, "2": 3.9741450807854346e-07}, "score": 4.994442891288326}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978081266702726, "4": 0.0021185296335684478, "3": 3.809006770403576e-05, "1": 3.470516620863747e-05, "2": 0}, "score": 4.997666468286335}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987935899983559, "4": 0.001157430288193819, "1": 3.4342359324721234e-05, "3": 1.4283050548823111e-05, "2": 0}, "score": 4.998676633704536}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5029573820534048, "5": 0.23527096183038254, "3": 0.1711441662815417, "4": 0.07860863700689885, "2": 0.012000794776648059}, "score": 2.5312265366490396}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9925361316483002, "4": 0.007393936548422407, "3": 5.985605269476059e-05, "1": 8.405410099231067e-06, "2": 0}, "score": 4.992452717099259}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9821565753216489, "4": 0.016513144150883917, "3": 0.0010492804871892014, "1": 0.00027015572661238024, "2": 0}, "score": 4.98030745841619}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9942401404637062, "4": 0.005527287998089269, "3": 0.000181784070694862, "1": 4.5720855842412276e-05, "2": 0}, "score": 4.993926229663717}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9637181457984958, "4": 0.03505399121305534, "3": 0.0010796493138215707, "1": 0.00013961038210802756, "2": 0}, "score": 4.96222794366682}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9892808954688412, "4": 0.010105827917633226, "3": 0.0004888618127202772, "1": 0.00012003658339717161, "2": 0}, "score": 4.988436251494733}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9815156798484519, "4": 0.017937872843104802, "3": 0.00046614025161026884, "1": 7.732679700695517e-05, "2": 0}, "score": 4.980820482305701}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.968417478730153, "4": 0.030440753277214815, "3": 0.0010012495590312794, "1": 0.00013722618611330007, "2": 2.015192164732255e-06}, "score": 4.96700175514319}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957751486015672, "4": 0.003981351278888825, "1": 0.00014294923367511557, "3": 9.888272559108807e-05, "2": 0}, "score": 4.9952490784099295}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9930478418438571, "4": 0.006848301593538244, "3": 8.725907419976765e-05, "1": 1.4062596722202504e-05, "2": 0}, "score": 4.992920911926452}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.956221354852382, "4": 0.037558303251882225, "1": 0.0035409249523185304, "3": 0.0026201159669343253, "2": 4.1031848505101305e-05}, "score": 4.942913626541197}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9837172920864546, "4": 0.014136851634338251, "3": 0.0013086358764525564, "1": 0.0008237326784886679, "2": 9.892793452374399e-06}, "score": 4.97992119533653}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9792958431304242, "4": 0.019023110440175815, "3": 0.0012748050678768824, "1": 0.00039154190939483653, "2": 7.212196548596766e-06}, "score": 4.976839301786779}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9889607442630681, "4": 0.010268715868566706, "1": 0.0004245156440526215, "3": 0.00033554616849723205, "2": 0}, "score": 4.987361996796525}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9896168915314183, "4": 0.009750726343284475, "1": 0.0003447240210639067, "3": 0.00027888250329181696, "2": 0}, "score": 4.988312510001129}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9604490590948656, "4": 0.035052217525974615, "3": 0.0032640255959975823, "1": 0.001217493550928747, "2": 1.3927364277890253e-05}, "score": 4.953507822636754}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9620041965575595, "4": 0.03632916924227074, "3": 0.0011163598731768298, "1": 0.0005445117698166457, "2": 3.999744795519045e-06}, "score": 4.95924799285958}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918745771652293, "4": 0.007491346684133823, "3": 0.00041235072354495726, "1": 0.00021888961419340897, "2": 1.4190059027491351e-06}, "score": 4.990804123365511}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903411423282796, "4": 0.008959868754839112, "3": 0.0005083377851281866, "1": 0.00018761210460366596, "2": 0}, "score": 4.989272974656768}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9962184943686019, "4": 0.003624014100291718, "3": 8.375740276009945e-05, "1": 7.196663133907506e-05, "2": 0}, "score": 4.9959205973585}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9081211265441844, "4": 0.08159631315147743, "3": 0.009440940259729034, "1": 0.0007985489418117159, "2": 3.073584484316023e-05}, "score": 4.896234123048429}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9919705278175021, "4": 0.007608233217221151, "3": 0.00029307046001220984, "1": 0.00012585362911111923, "2": 0}, "score": 4.991302191211959}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8958543186669613, "4": 0.09048972234263791, "3": 0.01218655968117318, "1": 0.001394465069462982, "2": 6.006693705486123e-05}, "score": 4.879377303871863}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9869567610186679, "4": 0.012530901065626685, "3": 0.00038793513893824926, "1": 0.00012018780462945946, "2": 0}, "score": 4.986212419323711}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8475205688436822, "4": 0.1426461344260491, "3": 0.00898692082762787, "1": 0.0008029456740838195, "2": 3.7441943424364403e-05}, "score": 4.836054933642283}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"5": 0.993410407815809, "4": 0.006119168853085806, "3": 0.00042157873534306165, "1": 4.7222267856670136e-05, "2": 0}, "score": 4.992848773003166}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9917866216277325, "4": 0.008023456218486463, "3": 9.884278503848418e-05, "1": 7.938905861700288e-05, "2": 0}, "score": 4.991461202155774}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9946979318455529, "4": 0.005011533113592409, "3": 0.00017531363291638303, "1": 0.00011115710466318863, "2": 0}, "score": 4.994193187601276}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9916462868076796, "4": 0.008064061025785708, "3": 0.00017861641222265115, "1": 0.00010598510421505653, "2": 0}, "score": 4.9911547210585}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9805861057465988, "4": 0.017668639332526274, "3": 0.0010193073000385926, "1": 0.0007136777700095142, "2": 0}, "score": 4.977437758152017}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8670260122989942, "4": 0.10753305395770223, "3": 0.02433513471155253, "1": 0.0008968011534705734, "2": 0.0001831218096593734}, "score": 4.839655957502886}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9770753100031571, "4": 0.021186620606516354, "3": 0.0013986007590127449, "1": 0.0003312040192864774, "2": 7.096988633605974e-06}, "score": 4.974670041256559}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9976657316514583, "4": 0.002176876995855715, "3": 0.0001019793720434876, "1": 5.483395166089772e-05, "2": 3.755125290452236e-07}, "score": 4.997398701389021}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903496800960696, "4": 0.009237989533109186, "3": 0.0003357190192792641, "1": 7.483745971594278e-05, "2": 9.07259790054416e-07}, "score": 4.989788491960479}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.914550556010172, "4": 0.07741024057250234, "3": 0.0072488822095159704, "1": 0.0006930676115286342, "2": 4.642372104254879e-05}, "score": 4.905175633488504}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9839843013202347, "4": 0.012650005867180247, "3": 0.002522171606348295, "1": 0.0008309848452816221, "2": 8.711060656015e-06}, "score": 4.978955497855488}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9901797080935983, "4": 0.008878039707567863, "3": 0.0004633023468714004, "1": 0.0004631769015819264, "2": 0}, "score": 4.9883424641186265}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9916301097179326, "4": 0.007005063740138128, "3": 0.0007741200446141804, "1": 0.0005805349801415688, "2": 0}, "score": 4.989124445629178}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9931117954890013, "4": 0.0063014677281270515, "3": 0.0003620062793565993, "1": 0.0002180516710708456, "2": 0}, "score": 4.9921022602811975}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9931890523624943, "4": 0.006281739163367502, "1": 0.0003282736495513873, "3": 0.00019369283082136673, "2": 0}, "score": 4.992017722769183}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9680128296720023, "4": 0.02739250618206955, "3": 0.004221995902787455, "1": 0.0003557513593213235, "2": 1.3749143867115104e-05}, "score": 4.962699130984015}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9564292599733947, "4": 0.03514661383761286, "3": 0.007539714216511596, "1": 0.0008441460781228809, "2": 3.290299075227591e-05}, "score": 4.946298269043948}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9474947973159978, "4": 0.0424937870838658, "3": 0.009342003894701354, "1": 0.0006406056506224932, "2": 2.313175983714991e-05}, "score": 4.936190025168111}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9684218317765034, "4": 0.028852979955799867, "3": 0.0023841013931493148, "1": 0.0003251132418054218, "2": 9.87347193411306e-06}, "score": 4.965048530665296}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9745934347000972, "4": 0.022049662132407232, "3": 0.002293157706741992, "1": 0.0010355645935312607, "2": 1.2846591946125008e-05}, "score": 4.969182751743977}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.878869901188794, "4": 0.08433228582898886, "3": 0.033492190055580504, "1": 0.0030810537927811873, "2": 0.00021272208701243506}, "score": 4.835719006383062}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9360067368884984, "4": 0.056498465527718006, "3": 0.006787685258666825, "1": 0.0006641158173353957, "2": 3.7742604830109945e-05}, "score": 4.927156090156284}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.977722051754501, "4": 0.02091862643340571, "3": 0.0011860941465267828, "1": 0.0001639113213269451, "2": 0}, "score": 4.976053316892689}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9853548469244746, "4": 0.014140951915824285, "3": 0.00032494195226574844, "1": 0.0001687964511527541, "2": 0}, "score": 4.984533816556125}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9930184563048218, "4": 0.0062943775275814745, "3": 0.00038029195408944557, "1": 0.00030430410840070213, "2": 1.2672986121278005e-06}, "score": 4.991724009452787}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9516149597961409, "4": 0.04509689869119094, "3": 0.003183910884271137, "1": 9.63768047429331e-05, "2": 5.394255321575442e-06}, "score": 4.948133461986037}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9975293022104506, "4": 0.0022041176696130237, "3": 0.00018473983868506726, "1": 8.006482010934611e-05, "2": 0}, "score": 4.99710613823464}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9351582852348401, "4": 0.0610127268307949, "3": 0.0034169350976023575, "1": 0.0003720126867894313, "2": 0}, "score": 4.930662575945984}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.985398141411492, "4": 0.013589885176116444, "3": 0.000787803393398668, "1": 0.00021520252424121837, "2": 0}, "score": 4.983973554223053}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9979027342416332, "4": 0.001758071164786625, "1": 0.00024798135402721193, "3": 8.995077335454199e-05, "2": 0}, "score": 4.997070098173493}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9854983851505394, "4": 0.013897262509550815, "3": 0.0005365211363132133, "1": 6.432359771719279e-05, "2": 0}, "score": 4.984772347414351}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9951197851341386, "4": 0.004761326371878875, "3": 6.326609476746968e-05, "1": 4.9875832059308524e-05, "2": 0}, "score": 4.994912608875314}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9971492658813954, "4": 0.002754264062531586, "3": 7.807013254986258e-05, "1": 1.7217512904995553e-05, "2": 0}, "score": 4.997020722098019}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993629409383474, "4": 0.0006244095966790265, "3": 5.49101740467204e-06, "1": 4.516067341634779e-06, "2": 0}, "score": 4.999346542372463}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9906249900110246, "4": 0.008978450155836882, "3": 0.0003683675651279303, "1": 2.671776120618092e-05, "2": 7.251357197182624e-07}, "score": 4.990175760899922}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9801021627959199, "4": 0.017855987371941936, "3": 0.0018487134763434986, "1": 0.0001857520199245424, "2": 4.74188415587749e-06}, "score": 4.97768929298824}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9102652303635987, "4": 0.0800622917837433, "3": 0.009190164894106945, "1": 0.00042877253547103937, "2": 3.411289816102952e-05}, "score": 4.899738001749207}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9805417440540799, "4": 0.018172787429536222, "3": 0.00125910138369704, "1": 2.3883899192525e-05, "2": 0}, "score": 4.979213422588375}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9291876492354852, "4": 0.05761354976321088, "3": 0.012239701370874002, "1": 0.0008903445814505157, "2": 5.4681889013842984e-05}, "score": 4.914180415749459}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9846799711382334, "4": 0.01441770519816432, "3": 0.0007809940707678101, "1": 0.00011594924566221774, "2": 3.0877650918111272e-06}, "score": 4.983547208663001}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6557777258503258, "4": 0.237935416828099, "3": 0.09574447068538022, "1": 0.01004176182033842, "2": 0.0004948713639380904}, "score": 4.528921270099149}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9058914431870287, "4": 0.08679113446779661, "3": 0.0071785088395854, "1": 0.0001221868655778265, "2": 1.3786302930010435e-05}, "score": 4.898321442512698}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9788834182741128, "4": 0.019410451905022205, "3": 0.001159921672326694, "1": 0.0005398691298001196, "2": 4.356933821284416e-06}, "score": 4.976097110052102}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9804858184895527, "4": 0.01854531838404562, "3": 0.0007114606839053571, "1": 0.00025227822803409366, "2": 0}, "score": 4.979022539843003}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9751263613472778, "4": 0.023106026685627206, "3": 0.0012866061743919707, "1": 0.00046416289524935187, "2": 8.682257347730232e-06}, "score": 4.972437837687661}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9592987597776967, "4": 0.03558968963733594, "3": 0.004234262966110745, "1": 0.0008172988831130654, "2": 3.344480800598015e-05}, "score": 4.9525709955219055}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9837875556195461, "4": 0.015203357307893557, "3": 0.0005814160293256464, "1": 0.00041338289002433234, "2": 0}, "score": 4.981980021601146}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9922868680501582, "4": 0.007272511400342975, "3": 0.0003214378003607069, "1": 0.00011654792455231574, "2": 1.2444050671112103e-06}, "score": 4.991614676426407}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979187637817852, "4": 0.00193783869827831, "1": 7.182883937144222e-05, "3": 7.054067952612315e-05, "2": 0}, "score": 4.997633762152688}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9893330517324773, "4": 0.010111508989154501, "3": 0.00042624596316160685, "1": 0.0001254810257582452, "2": 1.976329937812088e-06}, "score": 4.988528126076967}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9299365880983604, "4": 0.06193350310958621, "3": 0.0075226485667804575, "1": 0.0005660759508401965, "2": 3.213920286251424e-05}, "score": 4.920659760706762}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.878917247185624, "4": 0.10593816543868297, "3": 0.01394918772512026, "1": 0.0009706794187049737, "2": 0.00016520374956669755}, "score": 4.8617769036350875}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9835972239307195, "4": 0.01538065850733021, "3": 0.000897403826900814, "1": 0.00011877245953578202, "2": 3.774211768922845e-06}, "score": 4.9823380830909185}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9904551530013203, "4": 0.00899949332907576, "3": 0.0003996848085898219, "1": 0.00014166336271382335, "2": 0}, "score": 4.9896344420836645}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987076233389405, "4": 0.001088295030030664, "1": 0.00016987749471643554, "3": 3.320882181563591e-05, "2": 0}, "score": 4.998165775521842}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.989966801751607, "4": 0.009391330523560752, "3": 0.0005845048379570044, "1": 5.088903907170262e-05, "2": 0}, "score": 4.989236033959959}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994123026370406, "4": 0.005608413488876075, "3": 0.00022487879270482645, "1": 3.9662277932464065e-05, "2": 0}, "score": 4.993783154828048}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9964215499678091, "4": 0.003454239367929837, "3": 0.00011453615736183415, "1": 8.17403410871973e-06, "2": 0}, "score": 4.9962839866051345}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996026565818134, "4": 0.00038628427338734524, "1": 5.511093484234051e-06, "3": 4.084762381040936e-06, "2": 0}, "score": 4.9995835012184555}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9671536980347224, "4": 0.03132475185059806, "3": 0.0011412535676159543, "1": 0.0003677469839043913, "2": 0}, "score": 4.964921312856354}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6734099679124004, "4": 0.2359184227562418, "3": 0.08873896467924362, "1": 0.0016367028796983355, "2": 0.00029274313669911116}, "score": 4.579177260897737}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9884958714113153, "4": 0.011139836738736954, "3": 0.0003389314443808169, "1": 2.4763296026623926e-05, "2": 2.212083100424607e-07}, "score": 4.9880825790836925}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9493842741403975, "4": 0.04624368337623404, "3": 0.0033379728079032, "1": 0.001018012583426945, "2": 1.1598288660531416e-05}, "score": 4.9429732715373005}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9847087517850281, "4": 0.014953607558421152, "3": 0.0003302416165654563, "1": 6.800394042735502e-06, "2": 0}, "score": 4.984358698268675}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9911417564870121, "4": 0.008653180826724147, "3": 0.00019474101701549265, "1": 9.218492841247234e-06, "2": 0}, "score": 4.990920453151538}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9386128735709244, "4": 0.056123593127752364, "3": 0.004085690221792722, "1": 0.0011504540367045834, "2": 2.3506725177247277e-05}, "score": 4.931032422352269}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9728325005945836, "4": 0.025692172640198737, "3": 0.0012444143018977068, "1": 0.00022508667673691788, "2": 4.485650652295483e-06}, "score": 4.970905156106056}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9219667490619449, "4": 0.06927713981539503, "3": 0.008222092831068091, "1": 0.0005040029685147666, "2": 2.50892020901191e-05}, "score": 4.912186962464492}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903570488202778, "4": 0.008947393662494219, "3": 0.0003731285349348648, "1": 0.00031946143361269983, "2": 0}, "score": 4.989028470974639}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9767276297967882, "4": 0.02234449269821252, "3": 0.0007915353639360987, "1": 0.00013194373186610644, "2": 2.7004422555921947e-06}, "score": 4.975536518781501}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9091601024552268, "4": 0.08433278339094302, "3": 0.006201944543848596, "1": 0.0002790878363675425, "2": 1.651163952493333e-05}, "score": 4.902096504307734}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9657483093940518, "4": 0.031887646539796, "3": 0.002153193263245191, "1": 0.00020600214018110405, "2": 3.0093934835173975e-06}, "score": 4.9629728620896625}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9449841349897079, "4": 0.051525018147397475, "3": 0.0027504437958911676, "1": 0.0007172756802351965, "2": 1.610291896875515e-05}, "score": 4.940056261710112}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.883856676628334, "4": 0.10671779057894906, "3": 0.007516246509533198, "1": 0.0018645666726270402, "2": 3.2665372045740244e-05}, "score": 4.870691894884599}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9054475202427593, "4": 0.08391156771357919, "3": 0.008967165057197737, "1": 0.0015511397433107545, "2": 6.910945540573742e-05}, "score": 4.8917364229707}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9860530180335492, "4": 0.012985880852643997, "3": 0.0005451797506350137, "1": 0.0004085699590266815, "2": 0}, "score": 4.984289364314748}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9747950258335536, "4": 0.023065686470107625, "3": 0.001968553243882235, "1": 0.0001590752813793337, "2": 5.429584208340109e-06}, "score": 4.972344444881303}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9968018667578997, "4": 0.0028851453471398763, "3": 0.0002332404878477011, "1": 7.897067317906357e-05, "2": 4.343631072478157e-07}, "score": 4.996331186639032}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9932876024624977, "4": 0.006365855812511076, "3": 0.00022195298007257096, "1": 0.00012334749786925976, "2": 5.825930044265196e-07}, "score": 4.992695095645449}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9966251622101775, "4": 0.0031063812981205275, "3": 0.00018302112035615726, "1": 8.369151161569357e-05, "2": 0}, "score": 4.996192803775488}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9940876839368232, "4": 0.005497768479911255, "3": 0.0002348012843619388, "1": 0.00017898617316416366, "2": 5.712550811416785e-07}, "score": 4.993314969230858}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9971197529933276, "4": 0.002734344343503128, "1": 7.32511214709997e-05, "3": 7.20306381211347e-05, "2": 0}, "score": 4.996828587925229}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8815776786849847, "4": 0.09808104031989585, "3": 0.015284592257265871, "1": 0.004932526241302764, "2": 0.0001019099477327868}, "score": 4.851310631639736}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9792438252961128, "4": 0.019217858539264495, "1": 0.0009079211702836591, "3": 0.00062290035237723, "2": 3.6044116659677568e-06}, "score": 4.9758937490609805}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9762886083544845, "4": 0.020884888913669606, "3": 0.0014378303543121822, "1": 0.0013742015602226279, "2": 1.174753648743266e-05}, "score": 4.970707321755164}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.845481475842008, "4": 0.13764904297704506, "3": 0.014366166292146433, "1": 0.0024344103690604377, "2": 5.3719338512604956e-05}, "score": 4.823717148059829}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9244869315036256, "4": 0.0665227489730107, "3": 0.007692618855951641, "1": 0.0012587010531129605, "2": 2.5452387702928413e-05}, "score": 4.912979673055437}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9394422320419261, "4": 0.04916071254418023, "3": 0.009603554390722616, "1": 0.0017508953382909893, "2": 3.108739892956464e-05}, "score": 4.9245344658908214}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9231860498409674, "4": 0.0739579566956051, "3": 0.0024890255263110353, "1": 0.00034159388406538194, "2": 0}, "score": 4.9196955790668735}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9804994483176495, "4": 0.018572588905624608, "3": 0.0007797969442940102, "1": 0.00014488641026890343, "2": 1.663972070934976e-06}, "score": 4.979283246181616}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9432140818537851, "4": 0.053204180760422874, "3": 0.003133251486641759, "1": 0.0004347738704866112, "2": 7.65136113353872e-06}, "score": 4.938766895587459}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9837972371205187, "4": 0.015504617441012454, "3": 0.0006493569451004389, "1": 4.651689397789368e-05, "2": 0}, "score": 4.983010562499678}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8882739067541615, "4": 0.09395404492794694, "3": 0.016484363731806694, "1": 0.0011836628951429056, "2": 7.613008775100218e-05}, "score": 4.868110507155215}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9580212304840465, "4": 0.03927586778444551, "3": 0.0023032387370779937, "1": 0.0003730634669924618, "2": 1.2174182950938477e-05}, "score": 4.954588223244053}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8840686809324204, "4": 0.09886262685417366, "3": 0.013691195732460252, "1": 0.0032264010143968256, "2": 0.0001323336728938495}, "score": 4.8604497583918}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.967078766836187, "4": 0.03179573874196667, "3": 0.0008915915801728597, "1": 0.00022910320020680635, "2": 0}, "score": 4.9655044997308275}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9307567686520426, "4": 0.06510354998466067, "3": 0.003387680872858384, "1": 0.0007404708428359255, "2": 9.733062140730726e-06}, "score": 4.925129871201273}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9604032093116536, "4": 0.03678095481405663, "3": 0.00263932150641824, "1": 0.00016934237581455515, "2": 3.2357914748922202e-06}, "score": 4.957253157035276}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.979101753199679, "4": 0.019170266885152044, "3": 0.0011412996751914532, "1": 0.0005702785684156598, "2": 0}, "score": 4.976265630207465}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.994484248426319, "4": 0.0051153062932145325, "3": 0.00022787917583976227, "1": 0.0001679554151154043, "2": 0}, "score": 4.9937570849105}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9847027455723141, "4": 0.01429966741041049, "3": 0.0008339247395709765, "1": 0.00016052770716204235, "2": 1.9053211136405812e-06}, "score": 4.983384635894033}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.94376216635501, "4": 0.05157104538190213, "3": 0.004245192978770219, "1": 0.00041344519152015875, "2": 6.0467053772203865e-06}, "score": 4.938266517928916}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9903440608679265, "4": 0.008212753730514692, "3": 0.0011047797335901686, "1": 0.00033399584673167275, "2": 3.691151828408105e-06}, "score": 4.988230621501602}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9945091306340401, "4": 0.004475807037230765, "1": 0.0007798494263943637, "3": 0.00023368745448397547, "2": 9.08468156824673e-07}, "score": 4.9919346899676205}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8774552255133061, "4": 0.11663385448449229, "3": 0.005281439953388976, "1": 0.0006152800671981016, "2": 1.2655963891711199e-05}, "score": 4.870303977195305}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9964660575253173, "4": 0.003465468313713767, "3": 5.803373955986165e-05, "1": 9.215847513424495e-06, "2": 0}, "score": 4.99638159638611}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9956707841891029, "4": 0.004286947233212061, "3": 3.8621169468532294e-05, "1": 2.5112096214769904e-06, "2": 0}, "score": 4.995625760619359}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9675105362080286, "4": 0.031492331727765235, "3": 0.0009202148339670855, "1": 7.250420483944518e-05, "2": 0}, "score": 4.966377073406114}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994926098259526, "4": 0.0004768993956059825, "1": 2.131230398814535e-05, "3": 8.540892905074684e-06, "2": 0}, "score": 4.999420769233325}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9529767874212254, "5": 0.04694460919725317, "1": 4.4131268079771606e-05, "3": 2.8045285920343913e-05, "2": 0}, "score": 4.046784470782817}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9850208209629514, "4": 0.014129553248759618, "3": 0.0006305284378049426, "1": 0.00021306612381191144, "2": 3.391087132256659e-06}, "score": 4.983746909208558}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9979155594697793, "4": 0.0020116318914882585, "3": 4.119935323135894e-05, "1": 3.1044962533284186e-05, "2": 0}, "score": 4.997781788300128}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9979127080299335, "4": 0.0019654432236227383, "3": 7.733190074397913e-05, "1": 4.361170414243506e-05, "2": 0}, "score": 4.997705444081422}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996941397747786, "4": 0.0002889499697181822, "1": 9.772746653969635e-06, "3": 6.77068699379581e-06, "2": 0}, "score": 4.999658417544378}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984852138484582, "4": 0.0014069922627170622, "1": 5.756280185559128e-05, "3": 4.9129641931238834e-05, "2": 0}, "score": 4.998264495334435}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9726400651491068, "4": 0.025747374969524835, "3": 0.0013487303642203009, "1": 0.0002505582824576363, "2": 9.532857906477859e-06}, "score": 4.970524222406921}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9975631114455076, "4": 0.0023556914152929338, "3": 4.163797277336588e-05, "1": 3.890748147486926e-05, "2": 0}, "score": 4.997405401022401}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9911971519566246, "4": 0.008300761677637384, "3": 0.00037373259608591754, "1": 0.00012526726289395374, "2": 1.8271832217851132e-06}, "score": 4.990445210496379}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9862540493753128, "4": 0.013427005020242994, "3": 0.00027547656403866455, "1": 4.088901961625508e-05, "2": 0}, "score": 4.985858449287719}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9877689745541737, "4": 0.012012974559410883, "3": 0.0002017936333194685, "1": 1.4919701053769767e-05, "2": 0}, "score": 4.987523742682092}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9612367388424694, "4": 0.03646576878314166, "3": 0.0020985920741074036, "1": 0.0001896147833362869, "2": 5.352552542980862e-06}, "score": 4.9585623673049355}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9723095248593664, "4": 0.026221651928989162, "3": 0.001198429055801491, "1": 0.00025980193648569275, "2": 4.909737892331239e-06}, "score": 4.9703273843857}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9807086562689965, "4": 0.01757010501239343, "3": 0.0013341712051912064, "1": 0.0003737651122362089, "2": 6.469135985647057e-06}, "score": 4.978246936075867}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9928594263106768, "4": 0.00672069303201803, "1": 0.0002365287010240355, "3": 0.00017781391070660307, "2": 0}, "score": 4.991977519913612}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9956449013665208, "4": 0.004042911007771361, "1": 0.00020831358362284464, "3": 0.00010210202494831215, "2": 0}, "score": 4.994919621605323}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9859338814311565, "4": 0.012833607024493598, "3": 0.0009787591128501754, "1": 0.00024777288938014575, "2": 2.7701266965065103e-06}, "score": 4.984209422133672}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9557569296002876, "4": 0.04215159728488358, "3": 0.0017397822800373122, "1": 0.0003367807273722048, "2": 9.251692964476418e-06}, "score": 4.9529936941854995}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982923692633138, "4": 0.0015982547920680287, "1": 6.54899409761367e-05, "3": 4.3428832244563614e-05, "2": 0}, "score": 4.998052926889393}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9769782404390652, "4": 0.0210694680137845, "3": 0.0017295828962073793, "1": 0.0002124162000676649, "2": 5.204182129209133e-06}, "score": 4.97460595963544}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9937766582116939, "4": 0.005942612069059317, "3": 0.00014068728042881346, "1": 0.00013493289192112695, "2": 0}, "score": 4.993236247242686}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9447246779713188, "4": 0.046141879146818505, "3": 0.006143663828789491, "1": 0.0029106903274631626, "2": 7.147148492848956e-05}, "score": 4.929713082038594}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9952903911515709, "4": 0.004530853258225577, "3": 0.00010381147958946837, "1": 7.274604628408626e-05, "2": 0}, "score": 4.994970528542358}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9989645105895444, "4": 0.0010091781421730952, "3": 1.568802304679067e-05, "1": 8.609769595389984e-06, "2": 0}, "score": 4.998925004568876}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999414491636959, "4": 0.0005704192164518211, "1": 9.466417710477722e-06, "3": 4.744269923578172e-06, "2": 0}, "score": 4.99938222603017}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986507961949579, "4": 0.0012632784408682228, "1": 4.9224209129892286e-05, "3": 3.622380712160743e-05, "2": 0}, "score": 4.998467376376773}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9779190112100299, "4": 0.020353709473400598, "3": 0.0015408531845888518, "1": 0.00017515714772322659, "2": 0}, "score": 4.975863683574758}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9874420238062341, "4": 0.012119324914694399, "3": 0.0003662250949798948, "1": 4.8485634488934964e-05, "2": 0}, "score": 4.986953970028264}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9641833812022562, "4": 0.030596305885727988, "3": 0.004740256646071985, "1": 0.0004295227712075347, "2": 2.1589013649648536e-05}, "score": 4.95813911105464}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9844607447341003, "4": 0.014964807516581299, "3": 0.00036101393473586915, "1": 0.00019652301673560944, "2": 0}, "score": 4.983526793971948}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9601843276333657, "4": 0.036466158968955116, "3": 0.002843385099948235, "1": 0.0004748361788729269, "2": 1.8362445214907036e-05}, "score": 4.955892068478852}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8892210003884323, "4": 0.0986478343123303, "3": 0.01118855721702704, "1": 0.00090838750752644, "2": 3.170490998368112e-05}, "score": 4.875246072654508}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.984057363883001, "4": 0.01526198779215537, "3": 0.0005399034125783288, "1": 0.0001332629918311747, "2": 0}, "score": 4.9831250271581595}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9839471349671335, "4": 0.01578739566558077, "3": 0.00023545093739299654, "1": 2.7493058591727803e-05, "2": 0}, "score": 4.983631688889203}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972652030890398, "4": 0.002514601342306897, "1": 0.00015443519491635044, "3": 6.4156509432044e-05, "2": 0}, "score": 4.9967393396295074}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9862528855962212, "4": 0.012630244299649977, "3": 0.000565969878146331, "1": 0.000547935652695103, "2": 1.796597427542476e-06}, "score": 4.984040664900877}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9821111535946936, "4": 0.016597541450166266, "3": 0.0010140547309235351, "1": 0.0002734146638398221, "2": 2.8909337822011835e-06}, "score": 4.980271998995685}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9973482014460213, "4": 0.0025700608585133363, "3": 4.981367565930049e-05, "1": 3.0847464469059335e-05, "2": 0}, "score": 4.997206918925386}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9850988928669302, "4": 0.01415702941218588, "3": 0.0005563979958035079, "1": 0.000185853654073847, "2": 1.176496033765172e-06}, "score": 4.98398322008771}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9823808587013672, "4": 0.01574441783040004, "3": 0.0010499155989456834, "1": 0.0008214564784829152, "2": 2.701960330678977e-06}, "score": 4.9788618054489975}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9945698571160633, "4": 0.005071966838597469, "1": 0.0001827360127286633, "3": 0.00017428459350883052, "2": 0}, "score": 4.9938485128158}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9357994671088615, "4": 0.05843717695449112, "3": 0.005647443579622729, "1": 0.00010074036444239482, "2": 9.582672866904946e-06}, "score": 4.929835834239937}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9776362467217024, "4": 0.021842147591405216, "3": 0.00048539575989019814, "1": 3.2133482593523756e-05, "2": 0}, "score": 4.977058433438419}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9763672496164659, "4": 0.02271418862948431, "3": 0.0008214145031293439, "1": 8.836178307086655e-05, "2": 0}, "score": 4.975289318137073}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9753955382440174, "4": 0.023482016643439713, "3": 0.0010082612160479203, "1": 0.00010691975052316598, "2": 0}, "score": 4.974073593589171}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9671845826468782, "4": 0.03129726391854162, "3": 0.0013928939747041163, "1": 0.00011556608813460985, "2": 4.8771671924554895e-06}, "score": 4.965439885829356}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8651980835004001, "1": 0.06601173828279627, "4": 0.04844245889120507, "3": 0.019541712411491195, "2": 0.0008023737790528337}, "score": 4.646018755755803}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.990421942606377, "4": 0.008642382343262091, "1": 0.0006219328059997186, "3": 0.000310864634307298, "2": 1.630967762503321e-06}, "score": 4.988243249604374}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.978879304035752, "4": 0.019024520104886866, "3": 0.0014907239567669374, "1": 0.000582835833768855, "2": 1.2756941540009356e-05}, "score": 4.975624177497547}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981174012163238, "4": 0.0017701772432153718, "1": 6.910800412241242e-05, "3": 4.225398031328422e-05, "2": 0}, "score": 4.9978688805216285}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9911918817753785, "4": 0.00832130903988894, "3": 0.0002856549340161616, "1": 0.00019620981237079707, "2": 0}, "score": 4.990322493992763}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9837089836452924, "4": 0.015889257929436577, "3": 0.0003697032134543838, "1": 2.9422437335867187e-05, "2": 0}, "score": 4.9832536018048215}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9886701645284302, "4": 0.01072879103681601, "3": 0.0005451721181719325, "1": 5.259376402008587e-05, "2": 0}, "score": 4.987970450231248}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9925274384594077, "4": 0.006986012802537843, "3": 0.0003476877677642471, "1": 0.00013585858899269122, "2": 0}, "score": 4.991775152611835}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951320629977896, "4": 0.00474094118855446, "3": 9.862931777848885e-05, "1": 2.6885283576480824e-05, "2": 0}, "score": 4.994954251567758}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9977498630621082, "4": 0.002176047763699051, "3": 6.516076721337148e-05, "1": 8.143829777162334e-06, "2": 0}, "score": 4.997661053547681}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9378491348110657, "4": 0.05148071538413736, "3": 0.009151013873373966, "1": 0.001445625758922345, "2": 6.242516990849865e-05}, "score": 4.924246638597492}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9948223872837137, "4": 0.004881751058576691, "3": 0.00019967090933228942, "1": 8.822281102400556e-05, "2": 0}, "score": 4.994365970987072}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9343032730298221, "4": 0.05042203989441552, "3": 0.01476231986108249, "1": 0.0004624653142686686, "2": 4.335476246446515e-05}, "score": 4.918072858450654}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970567078025023, "4": 0.0028299034061838963, "3": 9.416857789704959e-05, "1": 1.8133926171928874e-05, "2": 0}, "score": 4.99690922037586}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.970841715327333, "4": 0.0265826109672572, "3": 0.002338931682035783, "1": 0.00021335054368695476, "2": 0}, "score": 4.967885372285261}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9679935015527952, "4": 0.02613410794449331, "1": 0.0031428696347306773, "3": 0.0027130126027426656, "2": 1.3847234781914533e-05}, "score": 4.955826729060333}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8534525695470567, "4": 0.11556107510406796, "3": 0.026775119487675504, "1": 0.004067656271759997, "2": 0.00013448619548352744}, "score": 4.814212912811915}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9789909114483296, "4": 0.018671251332002762, "3": 0.0016942734044431407, "1": 0.0006354526362563384, "2": 6.544477458913257e-06}, "score": 4.975378719307512}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9765029555432392, "4": 0.022336584147693378, "3": 0.0007513169184065238, "1": 0.00040410314628629406, "2": 3.607354066223224e-06}, "score": 4.974533510877464}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9737836044948419, "4": 0.024581208747391357, "3": 0.0010502511005730773, "1": 0.000575212511631911, "2": 5.836656162629203e-06}, "score": 4.9709998163275415}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9362723992540407, "4": 0.05694449257993357, "3": 0.006439264200333689, "1": 0.00032629293710573974, "2": 1.5004175934103956e-05}, "score": 4.928826613475045}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9143082367936904, "4": 0.07885179508587113, "3": 0.0061010462873181725, "1": 0.0007100778116930612, "2": 2.589009745534285e-05}, "score": 4.906027853213776}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9899740344754817, "4": 0.009399999903238084, "3": 0.00036616727260259445, "1": 0.0002582470172205644, "2": 7.47090879432466e-07}, "score": 4.988832427228621}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9381221411569876, "4": 0.05604761957700468, "3": 0.005390268935699128, "1": 0.00040516571569145876, "2": 2.8340462617483092e-05}, "score": 4.931465715284945}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9813851194648788, "4": 0.018092537835509626, "3": 0.0004261040468862451, "1": 9.349421455510933e-05, "2": 0}, "score": 4.980681224193311}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8524101766577904, "4": 0.13176115858563003, "3": 0.013381622079209598, "1": 0.002405853626852349, "2": 3.496419570265797e-05}, "score": 4.831746242806223}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9680197587326361, "4": 0.029789333076599915, "3": 0.0021560606403694723, "1": 3.2302530084948534e-05, "2": 0}, "score": 4.965769248404363}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9225328167384196, "4": 0.06977826551569338, "3": 0.0067333936861072655, "1": 0.0009221656378005597, "2": 2.6860117294362357e-05}, "score": 4.912985138759926}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.94274672757305, "4": 0.05046797511507523, "3": 0.0064139030063728565, "1": 0.00034615081374430543, "2": 1.5531691632206423e-05}, "score": 4.935272391920712}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.978975138073835, "4": 0.01956343923150842, "3": 0.0013322034210742693, "1": 0.0001252767835677147, "2": 3.095686088440345e-06}, "score": 4.9772617404789585}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9856659400312693, "4": 0.01333737012478236, "3": 0.0007901055609295066, "1": 0.00020225910186449217, "2": 2.717160925937588e-06}, "score": 4.984265205561256}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9954229036785952, "4": 0.004381061203656308, "3": 0.000147713052593369, "1": 4.706389083057197e-05, "2": 0}, "score": 4.995135251007133}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9921359487263877, "4": 0.007393130653260712, "3": 0.00030779179310242544, "1": 0.0001610340056605015, "2": 0}, "score": 4.991347131611677}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9899352569620592, "4": 0.009510032357115252, "3": 0.0004157065314073619, "1": 0.00013621418790961865, "2": 0}, "score": 4.9891136674559835}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9962995401392367, "4": 0.003559349768850116, "3": 8.683454774410852e-05, "1": 5.2947590084140594e-05, "2": 0}, "score": 4.996055185536793}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9705693392409863, "4": 0.027739932428090128, "3": 0.0009264059763605083, "1": 0.000756508567211191, "2": 3.99969679886948e-06}, "score": 4.967369097802731}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9920089961884779, "4": 0.007579197163824376, "3": 0.00037649830979150247, "1": 3.252238293451894e-05, "2": 0}, "score": 4.991537693109249}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9620812042275141, "4": 0.032538684668388, "3": 0.004864523075047827, "1": 0.0004999107377397408, "2": 1.0617372322771204e-05}, "score": 4.955700549961961}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9916033801927656, "4": 0.007891176834897977, "1": 0.0002671968246947038, "3": 0.00023412696600270933, "2": 0}, "score": 4.9905717430976155}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9717659516499223, "4": 0.02670706878803822, "3": 0.0010054611369207593, "1": 0.0005101088620623344, "2": 0}, "score": 4.9692412225456595}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9199718971331592, "4": 0.07413400092730507, "3": 0.004984661906673777, "1": 0.0008871120135778592, "2": 1.5956121647749024e-05}, "score": 4.912299800023396}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9950805891328727, "4": 0.004307644689469144, "3": 0.00035972147734356216, "1": 0.00024874258286456893, "2": 1.8282688910306967e-06}, "score": 4.9939724483340155}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9686528695806508, "4": 0.02740947287424329, "3": 0.0035042421554686933, "1": 0.0004202255361422298, "2": 9.946697215879326e-06}, "score": 4.963871183407205}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.986383235418272, "4": 0.012685559242360636, "3": 0.0005945400360680147, "1": 0.00032891506553364485, "2": 0}, "score": 4.984809582694022}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.991961732053828, "4": 0.006874963118676754, "1": 0.0006361246647973768, "3": 0.0005232867316801251, "2": 3.1352426078487373e-06}, "score": 4.989524551088587}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9606886220807599, "4": 0.035554110625790454, "3": 0.003008162054031908, "1": 0.0007364037619865898, "2": 1.1165856083203266e-05}, "score": 4.955450384238609}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.980166403737225, "4": 0.018210944854779924, "3": 0.0013830162175673167, "1": 0.0002321933797706281, "2": 4.745451393876091e-06}, "score": 4.978079953732502}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9342231506168253, "4": 0.060316800427497534, "3": 0.00526623285665181, "1": 0.00017745242733239685, "2": 9.782338422430393e-06}, "score": 4.928411105984232}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9772039230735795, "4": 0.02200687223685604, "3": 0.0006592212129813612, "1": 0.0001251007681778338, "2": 2.663738422125247e-06}, "score": 4.976166238162802}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955322977075028, "4": 0.004336713395047445, "3": 7.895314363546908e-05, "1": 5.029781103481791e-05, "2": 0}, "score": 4.995304180912477}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9375414957347904, "4": 0.05495133519860259, "3": 0.005956302954643891, "1": 0.001518701478042158, "2": 2.6041269236777946e-05}, "score": 4.926982682060564}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.980828599368186, "4": 0.017937209154087932, "3": 0.0009888419964745418, "1": 0.00024065721051509832, "2": 2.5545052320698237e-06}, "score": 4.979114769847482}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9539279294857361, "4": 0.04456426385464684, "3": 0.0011501521971684315, "1": 0.0003338101966563936, "2": 0}, "score": 4.951799041647928}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.994333952341323, "4": 0.005470873423863596, "3": 0.00010184189461997163, "1": 9.182022212599708e-05, "2": 0}, "score": 4.993958152762407}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9916252988361254, "4": 0.007973840760993197, "3": 0.00020850219274877972, "1": 0.00019035382134045034, "2": 0}, "score": 4.990847721223422}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9954125128117642, "4": 0.004452179622095923, "3": 7.984542339292396e-05, "1": 5.31143192683032e-05, "2": 0}, "score": 4.995175660927349}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9966635339145531, "4": 0.003297016204440537, "3": 3.103959221931147e-05, "1": 6.5605081245324385e-06, "2": 0}, "score": 4.9966146563164795}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9954844528781397, "4": 0.004385445771754457, "3": 9.85749879936232e-05, "1": 2.9576305708874342e-05, "2": 0}, "score": 4.995299089862383}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987028687030052, "4": 0.0012596458108946721, "1": 2.133291228730625e-05, "3": 1.5248597901849525e-05, "2": 0}, "score": 4.998624524100755}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970711714114228, "4": 0.002774642691205378, "3": 8.635084220774369e-05, "1": 6.675275420747114e-05, "2": 0}, "score": 4.996785641128644}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9957500872480006, "4": 0.004033608073381985, "3": 0.00011792709068655905, "1": 9.775140361198482e-05, "2": 3.86459021159722e-07}, "score": 4.995338371636223}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9911842684597736, "4": 0.008045808551364959, "3": 0.0005107108393704909, "1": 0.0002572811762800756, "2": 1.4181093743514108e-06}, "score": 4.989899385556411}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9840113071399701, "4": 0.015180910933813378, "3": 0.0007064550368315788, "1": 9.946895226810922e-05, "2": 1.3019492414490596e-06}, "score": 4.983004387886374}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9910926862733915, "4": 0.00848772310618331, "1": 0.00027620671643404575, "3": 0.000141606567093658, "2": 8.808380967784847e-07}, "score": 4.990121585523616}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9950179193387828, "4": 0.004491565384566458, "1": 0.00030644140359514343, "3": 0.00017957618699528498, "2": 0}, "score": 4.993923489296826}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9628429447966242, "4": 0.03517478810579397, "3": 0.0015919016040043163, "1": 0.0003802216065852841, "2": 7.759241293540908e-06}, "score": 4.960097149381814}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9767695958009306, "4": 0.022065751022871654, "3": 0.00080557842354962, "1": 0.0003483738058290398, "2": 5.8683679215407945e-06}, "score": 4.974911870562582}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9865609444189019, "4": 0.013030167929707473, "3": 0.00022894128148927132, "1": 0.00016827904067917034, "2": 0}, "score": 4.985838668119675}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969878616191302, "4": 0.0029393914760218734, "1": 4.07001003466137e-05, "3": 3.1167458632254965e-05, "2": 0}, "score": 4.99683547042261}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970170098826395, "4": 0.002886655538807222, "3": 6.0012180980832236e-05, "1": 3.5391106436343755e-05, "2": 0}, "score": 4.996851752741552}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9769137229264583, "4": 0.021739834717692755, "3": 0.0012034690713393949, "1": 0.00013690901183080703, "2": 3.217699161293174e-06}, "score": 4.975295867672691}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9909022066547931, "4": 0.008592152433876855, "3": 0.00031852264072490516, "1": 0.0001843065783904714, "2": 0}, "score": 4.990033547948515}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.988918070044247, "4": 0.009331680149529302, "3": 0.001598555292215067, "1": 0.00014625629939406243, "2": 2.967825583657369e-06}, "score": 4.986877248173411}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9881807723552165, "4": 0.010969056672065597, "3": 0.0007085272769486241, "1": 0.00013952203670042454, "2": 1.2906339838099118e-06}, "score": 4.987051917965103}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9859346948269442, "4": 0.01264617602527099, "3": 0.0010027947771104415, "1": 0.00040695554684412074, "2": 5.0851298138951405e-06}, "score": 4.983705086878318}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9687902313901148, "4": 0.028698061558880876, "3": 0.0016493137280224515, "1": 0.0008529707515345842, "2": 8.491830281630751e-06}, "score": 4.964565919508133}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9910998350507196, "4": 0.008108203111125438, "3": 0.0006277792286743477, "1": 0.00015963589375820735, "2": 0}, "score": 4.9899976493786475}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9690537898024361, "4": 0.028393847346905345, "3": 0.002283130617441285, "1": 0.00025652344346643185, "2": 7.551797073848767e-06}, "score": 4.96599096686879}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9837029850061999, "4": 0.01433682323617374, "3": 0.0011368849007372009, "1": 0.0008111488352769316, "2": 6.327919808921283e-06}, "score": 4.980125711992696}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9866624766299423, "4": 0.01262443193601696, "3": 0.0005949399987146362, "1": 0.00011370342892622809, "2": 2.3574524318793737e-06}, "score": 4.985723772148328}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9426461946517464, "4": 0.05481116855749731, "3": 0.00214028988252137, "1": 0.0003780194154648992, "2": 1.1525057268807293e-05}, "score": 4.939360822514636}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9479516785688664, "4": 0.049343393123912546, "3": 0.0020937082560470795, "1": 0.0005896402221676654, "2": 1.046167477302707e-05}, "score": 4.944078622708506}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8544235482516935, "4": 0.11701880858121709, "3": 0.024495819711740016, "1": 0.0037764834748681346, "2": 0.00020846362341089532}, "score": 4.818244254506008}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.947595628444641, "4": 0.0489720084609161, "3": 0.00294372645068161, "1": 0.00046268596284407634, "2": 0}, "score": 4.943288323079711}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9292135925168185, "4": 0.06448636325089724, "3": 0.005670917827523187, "1": 0.0005890603015567852, "2": 2.6029709479692797e-05}, "score": 4.921736372220296}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9857114482925821, "4": 0.013626424410598824, "3": 0.0005901265810047206, "1": 6.523117885740569e-05, "2": 0}, "score": 4.984932295710582}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9469145738431238, "4": 0.04507213376704899, "3": 0.00771122669232271, "1": 0.00026788842199092753, "2": 3.125753783964148e-05}, "score": 4.938339906515526}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9954695701981744, "4": 0.004282128842242658, "3": 0.00018812047046753094, "1": 5.5955266441238005e-05, "2": 0}, "score": 4.995117788522627}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9919320520108736, "4": 0.0076745087045058105, "3": 0.00020000303830632562, "1": 0.00018949593213088165, "2": 0}, "score": 4.9911674666874015}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951072695913051, "4": 0.004709227015628779, "3": 0.00012683075475298215, "1": 5.439915158978517e-05, "2": 0}, "score": 4.9948195030907145}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9714751514507374, "4": 0.02686529967540974, "3": 0.0011305308249116232, "1": 0.0005201430958074213, "2": 4.36553853747502e-06}, "score": 4.968779828891232}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9823371447081575, "4": 0.017010125407952267, "3": 0.0005645847798001549, "1": 8.183954466976936e-05, "2": 0}, "score": 4.981533230410455}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9860549921136674, "4": 0.012780457916022048, "3": 0.0008482285007823767, "1": 0.0003102640031021375, "2": 2.983280571597666e-06}, "score": 4.984273030880663}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9940053414975615, "4": 0.005847696827273523, "3": 8.167684591482967e-05, "1": 6.09821719270039e-05, "2": 0}, "score": 4.993744993880041}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9853950098211746, "4": 0.013776886256450904, "3": 0.0007272019017039371, "1": 9.594178084428869e-05, "2": 0}, "score": 4.984384865361952}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9701807253939877, "4": 0.02776751407598794, "3": 0.0018777036715934047, "1": 0.0001688731021400349, "2": 4.383850983001247e-06}, "score": 4.967788408853092}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9727757617936478, "4": 0.02590624550906306, "3": 0.0011698309825110503, "1": 0.00014303388467567504, "2": 4.099145584481369e-06}, "score": 4.9711696298931045}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.971660586836815, "4": 0.02631318854239276, "3": 0.0019247407416015867, "1": 9.760059190140902e-05, "2": 2.6588097439322205e-06}, "score": 4.9694389137562025}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9679586563499089, "4": 0.030167225266326817, "3": 0.0016937538504676723, "1": 0.00017544902729650102, "2": 3.618080215535281e-06}, "score": 4.965732572223461}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9958164080055213, "4": 0.003970405692330998, "3": 0.00015068123183519566, "1": 6.123185483630179e-05, "2": 0}, "score": 4.9954832986739195}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7909831607499004, "4": 0.16285077309310886, "3": 0.04348777564656963, "1": 0.002560920281830272, "2": 0.00011333143263845172}, "score": 4.739588948441415}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994029256162146, "4": 0.005348957483284221, "1": 0.0004691237336030358, "3": 0.00015050082380544394, "2": 0}, "score": 4.99247352966399}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.986796537647494, "4": 0.012486595126191949, "3": 0.0005192734162147567, "1": 0.00019481639637404272, "2": 0}, "score": 4.985695552726514}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.993146489760405, "4": 0.006280175833054264, "1": 0.00031135930223263317, "3": 0.0002598880751043253, "2": 0}, "score": 4.991954594016809}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9965902407773384, "4": 0.0030857825219405134, "1": 0.0001734710207336084, "3": 0.00014951796576687088, "2": 0}, "score": 4.995921293434995}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"5": 0.906662285990501, "4": 0.07983061511841903, "3": 0.013071808377185133, "1": 0.000353702639231826, "2": 7.395764451840768e-05}, "score": 4.892388263534413}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9545684742926918, "4": 0.04136451877645292, "3": 0.003354082561675224, "1": 0.0006966227095527153, "2": 1.1190593484554301e-05}, "score": 4.949106993364009}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9885432837758065, "4": 0.010126492190590405, "3": 0.001015953193781254, "1": 0.0003084857212903597, "2": 3.835871116182863e-06}, "score": 4.986596124795868}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972787187170169, "4": 0.0025369738648866025, "1": 0.00010824947943584302, "3": 7.379954438661551e-05, "2": 0}, "score": 4.996882422087877}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9863059937851973, "4": 0.012724647732918141, "3": 0.0007781785199638887, "1": 0.00018517189539399753, "2": 0}, "score": 4.984978217393707}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9848707063643478, "4": 0.014037738062824105, "3": 0.000976589947260175, "1": 0.00011074281798895517, "2": 0}, "score": 4.983566041373255}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9737580585908486, "4": 0.025262972318491478, "3": 0.0008432458546121747, "1": 0.00012639097236058952, "2": 0}, "score": 4.97254471586289}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9920932421615187, "4": 0.0075930646072215145, "3": 0.0002749190135093224, "1": 3.685541511210774e-05, "2": 0}, "score": 4.991709659797785}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9950131969949437, "4": 0.004901740170867542, "3": 4.343052600204925e-05, "1": 3.980197594686872e-05, "2": 0}, "score": 4.994852181451123}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990145970286922, "4": 0.0009637732585429894, "1": 1.1677600947404235e-05, "3": 9.334825259495937e-06, "2": 0}, "score": 4.998970846051865}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9280534229674928, "4": 0.06791373378469118, "3": 0.0034086123704220052, "1": 0.0006013805073841858, "2": 1.7446735572942843e-05}, "score": 4.922810762135786}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9689165650287953, "4": 0.02897909995573345, "3": 0.0013329816550943922, "1": 0.0007501720333027267, "2": 1.0122336918122062e-05}, "score": 4.965323498103019}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9817469129155584, "4": 0.017290293574363486, "3": 0.0004939870281138345, "1": 0.0004609333972117443, "2": 0}, "score": 4.979877840357094}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9870624292788139, "4": 0.011856334467556899, "1": 0.0006575570694739789, "3": 0.0004151999693219508, "2": 0}, "score": 4.984682907438985}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9906775222658227, "4": 0.00818500546888356, "1": 0.0007490020780637266, "3": 0.0003808663621037197, "2": 0}, "score": 4.988057162683408}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9753445049337595, "4": 0.022619853158090585, "3": 0.0013698336087298992, "1": 0.0006253487899297589, "2": 2.066894966556023e-05}, "score": 4.972076524994531}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9953268844413642, "4": 0.00426597294909385, "3": 0.00021025793900301726, "1": 0.00019354838985275404, "2": 1.6808179635041673e-06}, "score": 4.99453426611128}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9910078048020137, "4": 0.007720539762247398, "3": 0.00079655426628971, "1": 0.0004692638817923531, "2": 3.953663264874994e-06}, "score": 4.988797414086744}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.994960557512711, "4": 0.004600056467587185, "3": 0.0002556336993651414, "1": 0.00018122503711077582, "2": 1.7086277414458925e-06}, "score": 4.994158645319958}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976072385283723, "4": 0.002252121991226993, "1": 8.215026398788805e-05, "3": 5.6880897145128184e-05, "2": 0}, "score": 4.997305510824933}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9199525282487339, "4": 0.0776907248526203, "3": 0.002265330759554947, "1": 8.67193947201815e-05, "2": 2.9749896439439006e-06}, "score": 4.917422668902547}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9714047259409725, "4": 0.027080082077927125, "3": 0.0008502005458622296, "1": 0.0006588657908293981, "2": 3.3476933551121597e-06}, "score": 4.968573923286862}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.975311613945614, "4": 0.02329460710316648, "3": 0.0013096601538073434, "1": 8.048699012134905e-05, "2": 1.925160917907702e-06}, "score": 4.973758304360686}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952763384471586, "4": 0.004555224786917209, "3": 0.0001123783786245478, "1": 5.4703930256127597e-05, "2": 0}, "score": 4.995001195964144}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9449531589174636, "4": 0.05141020424795168, "3": 0.0032104408975832314, "1": 0.0004155980461606051, "2": 7.34671708222054e-06}, "score": 4.94048428812507}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9709953359979799, "4": 0.027331751336333622, "3": 0.0011402280417016357, "1": 0.0005239017454020049, "2": 4.438819922799535e-06}, "score": 4.968278731339835}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9814987979239435, "4": 0.01782392541094506, "3": 0.0006072870373567341, "1": 6.576715555182788e-05, "2": 0}, "score": 4.980698350391456}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9617312146570697, "4": 0.03571939358577309, "3": 0.0022203727317642538, "1": 0.0003180289950303362, "2": 7.331627749049372e-06}, "score": 4.9585455984304385}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9931092061519925, "4": 0.006647578672611632, "1": 0.00014012985913889304, "3": 9.919102713823813e-05, "2": 0}, "score": 4.9925934909934675}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9963863978320174, "4": 0.0034128085669823545, "1": 9.910714701557383e-05, "3": 9.841394957303675e-05, "2": 0}, "score": 4.995993921835901}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9707329551099202, "4": 0.025197945892233925, "3": 0.00340604562960767, "1": 0.0006483414962773158, "2": 1.0753008307296644e-05}, "score": 4.9653642007201135}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.990391422234054, "4": 0.008856711905559669, "3": 0.0006425290038723526, "1": 0.0001052487459960082, "2": 2.137740773299254e-06}, "score": 4.989430801266546}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9712479480425644, "4": 0.026696294659608835, "3": 0.001761461529582418, "1": 0.00028095360753524576, "2": 8.520419340207657e-06}, "score": 4.968631255341092}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9906378602945, "4": 0.008908427857835969, "3": 0.0003609713376048503, "1": 8.882219460058226e-05, "2": 0}, "score": 4.990014301561435}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.996016343894045, "4": 0.003812576773270806, "3": 0.00012171801998901407, "1": 4.684276454253582e-05, "2": 0}, "score": 4.995756605441387}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9769040515284748, "4": 0.020667077577924853, "3": 0.001306545693028219, "1": 0.0011097705463792814, "2": 8.92333323607009e-06}, "score": 4.972253878095719}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9703991182486693, "4": 0.024269569435662105, "3": 0.0032701579254320293, "1": 0.0020377113258887745, "2": 2.0947232930691758e-05}, "score": 4.960976330314627}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.994037855844649, "4": 0.005352984623909071, "3": 0.00030810682521822225, "1": 0.000298466159520154, "2": 1.7256081825928001e-06}, "score": 4.992831754091607}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987877633531854, "4": 0.0011150277349330504, "1": 5.301402800997945e-05, "3": 4.392640227930015e-05, "2": 0}, "score": 4.998585062968583}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9797848316157667, "4": 0.017376718255811652, "3": 0.001485738981299141, "1": 0.0013414569225759186, "2": 9.150427119861735e-06}, "score": 4.974258470654963}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9243718160115778, "4": 0.060515121683174196, "3": 0.014175856612177958, "1": 0.0009060029462454836, "2": 2.8863174907915386e-05}, "score": 4.907422347190688}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7438179685589671, "4": 0.17136044078693013, "3": 0.076714127186571, "1": 0.007412125786850815, "2": 0.00065633974442422}, "score": 4.643579882810241}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6720201659870132, "4": 0.24521102809839587, "3": 0.07980631039669715, "1": 0.0023506803078943536, "2": 0.00044945446977769587}, "score": 4.584357782489196}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7841928160738725, "4": 0.17974530541928724, "3": 0.0348423910466488, "1": 0.0010843419214597873, "2": 0.0001121537343205026}, "score": 4.74589024115674}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6529259668648547, "4": 0.23011801337963392, "3": 0.10525046377668956, "1": 0.010906372800479569, "2": 0.0007805857176624441}, "score": 4.513404761276262}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9842813559074994, "4": 0.01446700557463795, "3": 0.0008764499126141868, "1": 0.0003693856269991874, "2": 2.9519724025482966e-06}, "score": 4.98229364569401}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9778266716555549, "4": 0.02031077795674682, "3": 0.0015037287832527883, "1": 0.000336871299886724, "2": 0}, "score": 4.975333737845235}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9884588331649294, "4": 0.011064948055248434, "3": 0.00032480290686801657, "1": 0.0001462675615627036, "2": 0}, "score": 4.987700312562144}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9848800794234619, "4": 0.01471176154513036, "3": 0.0003661726919183317, "1": 3.716775402061944e-05, "2": 0}, "score": 4.984407146919456}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9898831501214153, "4": 0.009703748740884022, "3": 0.0002378457984373115, "1": 0.00017213818543757451, "2": 0}, "score": 4.989131973043179}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9225110175455186, "4": 0.06864242466862283, "3": 0.008304882368122758, "1": 0.0005026989881995079, "2": 3.0879871317369865e-05}, "score": 4.912643667742752}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.95452340254258, "4": 0.04062695972951373, "3": 0.004103095459547579, "1": 0.0007031593643665588, "2": 2.399600979453157e-05}, "score": 4.948281221198049}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9709718440210043, "4": 0.027745827790091125, "3": 0.000980131315370697, "1": 0.0002925005532035394, "2": 0}, "score": 4.9691236079789665}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9741909542147615, "4": 0.024579254618973572, "3": 0.000893433189574402, "1": 0.0003251381139197663, "2": 0}, "score": 4.972333016126437}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9811946874029464, "4": 0.017760585049221813, "3": 0.0007738602935158805, "1": 0.00025958275615840803, "2": 0}, "score": 4.979653133734937}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9678094657331512, "4": 0.03052149773145915, "3": 0.00160319622779304, "1": 6.0901911269819707e-05, "2": 0}, "score": 4.966028334402326}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9848771878197936, "4": 0.014621079356377641, "3": 0.00037669828348231815, "1": 0.00012248083367702366, "2": 0}, "score": 4.9841355602288235}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9783615482748244, "4": 0.020918059546310718, "3": 0.000632725423542874, "1": 8.370034153593914e-05, "2": 0}, "score": 4.9774815989231636}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.986724687660276, "4": 0.01291205897510775, "3": 0.00029892435795720793, "1": 6.17529691630513e-05, "2": 0}, "score": 4.986243044993894}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9940604681767706, "4": 0.005708349222512455, "3": 0.00016342637089072093, "1": 6.655239671650223e-05, "2": 0}, "score": 4.993698580862982}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9897120556877984, "4": 0.00964894206703651, "1": 0.0003298736023690278, "3": 0.00030541684791059794, "2": 1.974986490278303e-06}, "score": 4.9884147847468965}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9656375859378725, "4": 0.0324672334422708, "3": 0.001444922488547613, "1": 0.0004395151370094232, "2": 7.351229351633965e-06}, "score": 4.962862681383486}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9343688260470309, "4": 0.061090598215785955, "3": 0.0032309276010147716, "1": 0.0012348620691971775, "2": 2.5710373740925757e-05}, "score": 4.927427405633795}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9521632479047997, "4": 0.045319539679045846, "1": 0.00129657474925051, "3": 0.0011885030558323728, "2": 0}, "score": 4.947115455788028}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9811679413814991, "4": 0.017866037763448583, "3": 0.000546738736195271, "1": 0.00041342559468252955, "2": 3.2983210225839314e-06}, "score": 4.979376834664116}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9655833302174683, "4": 0.029913099026174395, "3": 0.0042234328924831005, "1": 0.00025901126577757445, "2": 1.693484879982201e-05}, "score": 4.9605530202275006}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995064232091205, "4": 0.0002674872918124219, "1": 5.464674494269251e-06, "3": 3.600412988694987e-06, "2": 0}, "score": 4.999703388812364}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9913776644018679, "4": 0.007576541120717204, "3": 0.0008111772259830011, "1": 0.00022701760237205129, "2": 3.7303518462644584e-06}, "score": 4.989881803811982}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9947283670837846, "4": 0.004573264483930389, "3": 0.00042886387374827613, "1": 0.00026191697335939965, "2": 0}, "score": 4.993521290717377}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9957361467447886, "4": 0.0038414360920183683, "3": 0.00029232978275029446, "1": 0.0001255504359556402, "2": 0}, "score": 4.995071680239145}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9866808168825117, "4": 0.012625029085770017, "3": 0.00039734461736571014, "1": 0.0002930541950530359, "2": 1.8543895493003448e-06}, "score": 4.985402473983227}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9866298798135092, "4": 0.012417183494162258, "3": 0.0005006708293809959, "1": 0.00044671712216323077, "2": 0}, "score": 4.984794521987167}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9960472158990604, "4": 0.003849097783857431, "3": 7.093312685839704e-05, "1": 3.193282756620641e-05, "2": 0}, "score": 4.995881301273334}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957587191441956, "4": 0.004109820193381371, "3": 8.246711088891193e-05, "1": 4.591526157385293e-05, "2": 0}, "score": 4.995541570814208}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9961145031532576, "4": 0.0038028651861765506, "3": 5.6147690978664494e-05, "1": 2.5702070631231846e-05, "2": 0}, "score": 4.995982028007693}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.945035029425755, "4": 0.049709287107815726, "3": 0.00483437221638142, "1": 0.00040157602101394526, "2": 1.7156782182338403e-05}, "score": 4.93896403665083}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9709038473018248, "4": 0.027179414827942727, "3": 0.0017229884928732474, "1": 0.00018699886699094398, "2": 4.476007911402319e-06}, "score": 4.968613113305062}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9856340907223252, "4": 0.013247416853616911, "3": 0.0009090470545000458, "1": 0.00020377298548699693, "2": 2.5930156913477657e-06}, "score": 4.984111569122029}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9867317684220404, "4": 0.012533996580470238, "3": 0.0005921292613733758, "1": 0.00013924633487083057, "2": 0}, "score": 4.985724718738542}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9724790481892726, "4": 0.026247448360067777, "3": 0.0010884709127184555, "1": 0.0001779575534274417, "2": 0}, "score": 4.970863573461019}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9213757550419538, "4": 0.06993828980235221, "3": 0.007956015259546343, "1": 0.000707362495490084, "2": 1.732337174980838e-05}, "score": 4.911267793379768}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9925996726691575, "4": 0.007068245437201806, "3": 0.0001771843220009781, "1": 0.00015093534373999436, "2": 0}, "score": 4.99197361274146}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9865624587911138, "4": 0.012088247250622039, "3": 0.0009897858018627678, "1": 0.00035384733319917085, "2": 2.7548653261069064e-06}, "score": 4.984508482199179}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.991929705102415, "4": 0.007469185663775799, "1": 0.0004900488391949891, "3": 0.00010752738485508544, "2": 0}, "score": 4.990355530135727}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9977703952693735, "4": 0.0021155869230354094, "1": 7.857876974810315e-05, "3": 3.307175378069876e-05, "2": 0}, "score": 4.997503948581549}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"5": 0.957934470262109, "4": 0.038886135724373314, "3": 0.0029027520767940106, "1": 0.0002697710288642014, "2": 5.3677002500963374e-06}, "score": 4.9542131040786215}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9467604580478312, "4": 0.04602361705527192, "3": 0.006169690527131548, "1": 0.001012585822107921, "2": 3.146423669936338e-05}, "score": 4.937492129355309}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9820435473899124, "4": 0.016382059104539746, "3": 0.0014801364492746623, "1": 9.288698674974277e-05, "2": 1.091761621282876e-06}, "score": 4.980282839277607}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9830134306585262, "4": 0.016303996779989144, "3": 0.0006136597110394605, "1": 6.661165471547795e-05, "2": 1.411311703291104e-06}, "score": 4.982197987402233}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.981037362505334, "4": 0.01843264502933244, "3": 0.0005016188447865989, "1": 2.556030489312672e-05, "2": 0}, "score": 4.980461821094457}]