[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9195409875687739, "2": 0.04040180971873931, "3": 0.03565447193559964, "5": 0.0043934943017588666, "1": 8.349950059646947e-06}, "score": 3.887910253708132}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9842641458984503, "3": 0.006038431416609122, "2": 0.00567258135166589, "5": 0.004022462506845377, "1": 2.2597960321817105e-06}, "score": 3.9866320874076195}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8467716578424169, "5": 0.15181777894939, "3": 0.0012931179000707292, "2": 0.00011657799779613172, "1": 2.935185491046932e-07}, "score": 4.150290710733653}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.523403762676505, "5": 0.4765645491022542, "3": 2.130056414327217e-05, "2": 9.752108889346202e-06, "1": 0}, "score": 4.476524047174338}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9090009906329741, "5": 0.08860790536613816, "3": 0.002288670952461629, "2": 6.69855254481641e-05, "1": 0}, "score": 4.086188318525181}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9719644551170233, "5": 0.025901976511578214, "3": 0.0011741791162569203, "2": 0.0009583370645164909, "1": 4.751259073171455e-07}, "score": 4.022809711051246}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9243640698082163, "2": 0.03314795346008624, "5": 0.029252966255544428, "3": 0.013185348868862622, "1": 4.537612374299883e-05}, "score": 3.9496353662584713}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5223681612230844, "2": 0.38217271081492765, "3": 0.09365545528000324, "5": 0.001688765314819453, "1": 0.00010795911147282655}, "score": 3.1433580589032992}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6858754963013856, "5": 0.31401667166777064, "3": 8.870591370627056e-05, "2": 1.859376962047695e-05, "1": 0}, "score": 4.313890945313889}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9364361863465197, "5": 0.03805210782574315, "3": 0.012745857017321572, "2": 0.012745857017321572, "1": 1.639065832098862e-05}, "score": 3.999765363953859}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8545205051924617, "5": 0.1394966349826261, "3": 0.0040828312393980494, "2": 0.0018986928561829895, "1": 6.173436493116413e-07}, "score": 4.131614660550002}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9499344022830459, "5": 0.04879573829290254, "3": 0.0008265604530019517, "2": 0.0004424259288311283, "1": 0}, "score": 4.047084367088878}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5620282463175178, "5": 0.4377080383403313, "3": 0.00018561647043158214, "2": 7.737645674970547e-05, "1": 0}, "score": 4.43736798491758}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6583296732175656, "5": 0.34153691813558507, "3": 0.0001093261436182144, "2": 2.3276879178353155e-05, "1": 0}, "score": 4.341381313258607}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8926071156454094, "5": 0.10660671252022412, "3": 0.0006854164145147397, "2": 0.00010029868236719231, "1": 0}, "score": 4.105720747027603}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9607161260290249, "5": 0.03843348093203822, "3": 0.0006510323006582681, "2": 0.00019855369314118856, "1": 0}, "score": 4.03738537141678}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9055633434423883, "5": 0.08966291760671886, "3": 0.0038784371611813957, "2": 0.0008928669324546856, "1": 9.82099706138717e-07}, "score": 4.08399592230722}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9560933062628652, "5": 0.04200781107560231, "3": 0.0012885019686643881, "2": 0.0006086452331380079, "1": 5.379366686379881e-07}, "score": 4.039500452133358}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9123927688680602, "5": 0.08755966782666379, "3": 4.078039935307197e-05, "2": 6.762053106783093e-06, "1": 0}, "score": 4.08750536514583}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.4934519651014883, "4": 0.42207183260022335, "3": 0.08441967402358694, "1": 2.9218631123036143e-05, "5": 1.5639606234285754e-05}, "score": 2.928591876113485}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9841579121285039, "5": 0.00906378024830822, "2": 0.0034943985737740098, "3": 0.003282683666880084, "1": 5.803009434234039e-07}, "score": 3.9987905577508607}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8912416911410297, "5": 0.09999453944849812, "3": 0.0062933327476310304, "2": 0.0024645045145216707, "1": 4.757610555004347e-06}, "score": 4.088758029089816}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9125358925478957, "5": 0.07490549699728197, "3": 0.007533443783145451, "2": 0.005018355442736253, "1": 5.6951079842896515e-06}, "score": 4.057318320978891}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.685755272864776, "5": 0.31396162936982563, "3": 0.00023004537175406857, "2": 5.2138391477600047e-05, "1": 0}, "score": 4.313627593871417}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8821559187241778, "3": 0.07241176447806769, "2": 0.043919955279838226, "5": 0.0015028589774378869, "1": 8.264750621365786e-06}, "score": 3.841226193159222}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9259638490507799, "5": 0.07140267109801522, "3": 0.0019632186190920646, "2": 0.0006679514945588021, "1": 1.0200381799960033e-06}, "score": 4.068100577204538}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9422058630614423, "5": 0.05658385962932832, "3": 0.0010526897748661136, "2": 0.00015646847593490623, "1": 3.068118940852258e-07}, "score": 4.0552173573170185}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8929322614696183, "5": 0.10664555642058211, "3": 0.0003906808780093574, "2": 3.108236317884488e-05, "1": 0}, "score": 4.106192755297027}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7430987172757931, "5": 0.2568080398061649, "3": 8.220441885392461e-05, "2": 1.0782873171793643e-05, "1": 0}, "score": 4.256704335261275}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9044655067784875, "5": 0.09532995447770995, "3": 0.0001783681295139065, "2": 2.5696365404855295e-05, "1": 0}, "score": 4.095100238718569}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt4", "target_model": "human", "scores": {"4": 0.742301688629486, "2": 0.1997877951437675, "3": 0.05724015593879451, "5": 0.0006458944872191305, "1": 2.3526714387858925e-05}, "score": 3.5437591396681642}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9738742718642367, "3": 0.018693152474785906, "2": 0.007206852279921987, "5": 0.00019508055151582187, "1": 2.7668305656335535e-05}, "score": 3.9670051204558594}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5311560082732423, "5": 0.46874353209033404, "3": 9.389579072167836e-05, "2": 6.193098692486094e-06, "1": 0}, "score": 4.4686374238481505}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9591537564222147, "4": 0.040845688823579494, "3": 2.9340732665256887e-07, "2": 8.538631456404073e-08, "1": 0}, "score": 4.959153461015443}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9873884476429722, "5": 0.008813752440801145, "3": 0.0023354119019822666, "2": 0.001461463424100747, "1": 4.751826882556627e-07}, "score": 4.003553989739742}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9891571263647948, "2": 0.003918086038108122, "5": 0.003918086038108122, "3": 0.003004100771111246, "1": 1.824824025431589e-06}, "score": 3.993072333343085}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9409311489813147, "2": 0.03536136637967998, "3": 0.023555748279568942, "5": 0.00014227339990966557, "1": 5.872324534748782e-06}, "score": 3.9058458373141445}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9488403540229929, "5": 0.05028669247503582, "3": 0.0007285971390774327, "2": 0.00014346922581701872, "1": 2.482660210876925e-07}, "score": 4.049270443563723}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7247941467224756, "5": 0.2751008283415445, "3": 8.272464462711788e-05, "2": 2.191984866230977e-05, "1": 0}, "score": 4.2749743686115815}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5233624886832353, "4": 0.4765269687037266, "3": 7.91349448570915e-05, "2": 3.0989689672795243e-05, "1": 1.5761570712343594e-07}, "score": 4.523221037739206}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9475276560578249, "5": 0.051811196729254425, "3": 0.0005666468430799935, "2": 9.39592857351028e-05, "1": 0}, "score": 4.051056658940652}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8951286482281461, "5": 0.10361865477197733, "3": 0.0006981769341524206, "2": 0.0005523034138084044, "1": 0}, "score": 4.101816096701055}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9902244766154892, "5": 0.006366540815448998, "3": 0.002532434970898353, "2": 0.0008751861074450104, "1": 4.3390119068489355e-07}, "score": 4.002082433857733}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6512482975790826, "5": 0.34858812894155133, "3": 9.5442221885728e-05, "2": 6.76786696047317e-05, "1": 0}, "score": 4.34835748704283}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9751977851429766, "5": 0.02154492476314573, "3": 0.002166830019446319, "2": 0.0010895505578729973, "1": 3.4876586981509495e-07}, "score": 4.01719795697411}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8325665586442262, "5": 0.16394207742104625, "3": 0.0030499889845264838, "2": 0.000439392573330011, "1": 8.482274650808581e-07}, "score": 4.160010940083776}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6366417649617586, "4": 0.36274756494644445, "3": 0.0004965640896149247, "2": 0.00011254313360278751, "1": 8.592774287430272e-07}, "score": 4.635917984198919}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9218482931647201, "4": 0.0780719376316594, "3": 6.482144940766605e-05, "2": 1.446362038738587e-05, "1": 0}, "score": 4.921754990727307}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.86337476824687, "4": 0.13660572801018028, "3": 1.5111840233230211e-05, "2": 4.131347223281364e-06, "1": 0}, "score": 4.863351618663198}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.507726074633068, "5": 0.49210498554458615, "3": 0.0001390135705142668, "2": 2.9138827348322418e-05, "1": 0}, "score": 4.491908081659843}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt4", "target_model": "human", "scores": {"5": 0.5774632355488115, "4": 0.4224811282696065, "3": 3.997585144635667e-05, "2": 1.5412063670191502e-05, "1": 0}, "score": 4.57739257891724}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.72480091633142, "5": 0.2751033867911449, "3": 7.771338890932057e-05, "2": 1.789063797671202e-05, "1": 0}, "score": 4.274989917659247}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8626280131900754, "5": 0.13648757420035115, "3": 0.0005845624145191423, "2": 0.00029856526673600225, "1": 5.854430066375939e-07}, "score": 4.135304219566655}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5467112747547427, "5": 0.4532395660092069, "3": 3.668256440956664e-05, "2": 1.1909085044597398e-05, "1": 0}, "score": 4.4531793224932175}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6925378675728531, "4": 0.3073118343034502, "3": 8.956750241811225e-05, "2": 5.9664819462494664e-05, "1": 3.2303085240616344e-07}, "score": 4.6923285155804715}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9815090202871567, "5": 0.012163823734784732, "2": 0.003652242194973505, "3": 0.0026720374705410045, "1": 1.98868090664452e-06}, "score": 4.002181337767801}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9882595913145477, "5": 0.005350528167766513, "2": 0.004948429626038734, "3": 0.001440075120127007, "1": 4.1971706812195036e-07}, "score": 3.994012328919818}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9711819442748488, "5": 0.02213729358810494, "3": 0.0037285286013602143, "2": 0.0029495088913435168, "1": 1.7096156137480424e-06}, "score": 4.012504631049777}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8596088145673599, "5": 0.1403272758308972, "3": 5.17012809583281e-05, "2": 1.1536115100110715e-05, "1": 0}, "score": 4.140252596598331}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9927371029416883, "2": 0.0038713019783717466, "3": 0.003311300057796254, "5": 7.090539742725244e-05, "1": 4.6767178882230815e-06}, "score": 3.9890029194010066}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt4", "target_model": "human", "scores": {"5": 0.6076246315463482, "4": 0.39231193620983223, "3": 5.234924724632062e-05, "2": 1.0635394664856725e-05, "1": 0}, "score": 4.607551283450886}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5774730294083381, "4": 0.4224882936103038, "3": 2.424699174568898e-05, "2": 1.3815519448086042e-05, "1": 0}, "score": 4.577421506185984}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.71213653735989, "4": 0.2877291766831232, "3": 0.00010274760642428962, "2": 3.085042596779806e-05, "1": 1.618881778886035e-07}, "score": 4.711971977760185}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8080479646761102, "4": 0.19192822595398074, "3": 1.732891611581957e-05, "2": 6.083021671490771e-06, "1": 0}, "score": 4.808018790849274}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6222492394457174, "5": 0.377413226610166, "3": 0.000175777775487902, "2": 0.00016004748588206816, "1": 5.594621282760822e-07}, "score": 4.376916108636292}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.97149585089231, "3": 0.016715509131778716, "5": 0.009524210009920417, "2": 0.002262198162793459, "1": 1.9078320746521326e-06}, "score": 3.9882785772589284}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9804984168327724, "5": 0.01234265289775431, "3": 0.006304010253001364, "2": 0.0008531550131164501, "1": 1.2239294676542202e-06}, "score": 4.0043286631722435}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8385246755053456, "5": 0.1600352460813041, "3": 0.0013419775088490842, "2": 9.721252468645762e-05, "1": 3.6742890235113734e-07}, "score": 4.158497823805961}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.679071849757712, "5": 0.32077084156434804, "3": 0.0001493969052507278, "2": 7.32271790798778e-06, "1": 9.812457422122536e-08}, "score": 4.320606662245053}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9861740398023473, "5": 0.011661971850090474, "3": 0.0018165848439807902, "2": 0.0003467012846206318, "1": 4.2542677304274955e-07}, "score": 4.009150710689394}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9223309748039518, "3": 0.05203436048817642, "4": 0.025359521953622257, "1": 0.0002525308849740575, "5": 2.1723802699002317e-05}, "score": 2.1025661360041012}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5466716669576964, "5": 0.4532067299921486, "3": 8.799047394241219e-05, "2": 3.287963792007825e-05, "1": 0}, "score": 4.453053312302488}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9646589401602156, "5": 0.031993238352310896, "3": 0.0027521972123891107, "2": 0.0005952043892860818, "1": 2.1929346090539262e-07}, "score": 4.0280499801075775}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8550505234814999, "5": 0.14401399451446195, "3": 0.0006774195213103776, "2": 0.00025711965442454265, "1": 2.963887202752903e-07}, "score": 4.142821538843637}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8882065603796847, "5": 0.10944851751124203, "3": 0.0017690705204757384, "2": 0.0005743331094033684, "1": 7.047476792283766e-07}, "score": 4.106528753214726}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9100522222772153, "2": 0.07470163496509144, "3": 0.011455870190094088, "5": 0.003777745031016888, "1": 1.061089770061484e-05}, "score": 3.8428864710877395}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8980030089156248, "5": 0.10075314124811989, "3": 0.0008854124290369204, "2": 0.0003577389598363929, "1": 0}, "score": 4.099152320152089}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8883398457735563, "5": 0.09660248629996579, "3": 0.012091216488754303, "2": 0.0029630800328685238, "1": 1.8282506084332e-06}, "score": 4.078579746254317}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.4999424235952696, "5": 0.4999424235952696, "3": 8.046912399275568e-05, "2": 3.40727708994199e-05, "1": 0}, "score": 4.499794114260984}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5076530688727757, "5": 0.49203422593540264, "3": 0.00027642196529469433, "2": 3.4598265749624864e-05, "1": 0}, "score": 4.491689435916024}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9780927764507473, "1": 0.01791439857175037, "3": 0.003874260395776689, "4": 0.00011699246815292354, "5": 0}, "score": 1.9861938250554574}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9456931200203322, "5": 0.03783248325545621, "2": 0.009127513184085254, "3": 0.007334162885057017, "1": 1.0039703259140243e-05}, "score": 4.012213207635472}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9373969192338988, "5": 0.040547814349865534, "3": 0.01827632815366364, "2": 0.0037715334860547803, "1": 6.0359699230410825e-06}, "score": 4.014710331449922}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.629582202642533, "5": 0.3701123021767274, "3": 0.00025876920342585657, "2": 4.5675477566603415e-05, "1": 3.22528607247886e-07}, "score": 4.369761483608035}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.49984016583237945, "5": 0.49984016583237945, "3": 0.0002852293398688246, "2": 3.353764562726895e-05, "1": 0}, "score": 4.499488311414918}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7197824970789286, "2": 0.2127672997310453, "3": 0.06489036016315003, "5": 0.0024770637302522, "1": 7.839064199820088e-05}, "score": 3.511814789702735}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.9208394954087706, "3": 0.04656786816677014, "4": 0.032509611334425474, "1": 5.895595018159745e-05, "5": 2.1352430158779444e-05}, "score": 2.11159249534033}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9936803618448606, "3": 0.0033666415642304636, "5": 0.002139967579135117, "2": 0.0008122400771394983, "1": 0}, "score": 3.997148843611249}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9825563334869747, "5": 0.007985741020943411, "3": 0.006517771864650747, "2": 0.0029377899441245256, "1": 7.323758488827749e-07}, "score": 3.9955901849467326}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9850611948387367, "5": 0.010943042639984104, "3": 0.0025589035833140927, "2": 0.0014354148176651826, "1": 5.542350290506019e-07}, "score": 4.00551165162099}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt4", "target_model": "human", "scores": {"4": 0.973144663545703, "5": 0.021499564497154, "2": 0.003049286652939933, "3": 0.0023017223234555713, "1": 3.8006137162349134e-06}, "score": 4.013087879622014}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7180286559043733, "5": 0.28118406176733174, "3": 0.0004570942280640498, "2": 0.0003292329510009113, "1": 5.878053389890724e-07}, "score": 4.280066841102093}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7979043028213206, "5": 0.20174178325944941, "3": 0.00028493029116976763, "2": 6.87426318673196e-05, "1": 1.2862160984882403e-07}, "score": 4.201319004462855}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9043814496604823, "5": 0.09532108920418511, "3": 0.00028058636044854307, "2": 1.6078879170016947e-05, "1": 0}, "score": 4.095008420702191}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8901358655372158, "5": 0.10968625673454763, "3": 0.00015251371980943404, "2": 2.4897180346550484e-05, "1": 0}, "score": 4.109483999764251}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9727932437039462, "4": 0.01987666993668137, "3": 0.00487098745308847, "1": 0.0024492863073131304, "5": 6.5645014085596665e-06}, "score": 2.042194871576423}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.8941586577817063, "3": 0.07572688724717956, "4": 0.029195315811223643, "1": 0.0008955056743210487, "5": 2.1060274861296485e-05}, "score": 2.133285536991661}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt4", "target_model": "gpt35", "scores": {"2": 0.7283534575491545, "4": 0.2022564565386108, "3": 0.06881427982387088, "5": 0.0004935709205967695, "1": 8.057323786519166e-05}, "score": 2.474728121389877}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.872498049882276, "5": 0.09487974797369537, "2": 0.017827376456955084, "3": 0.014779414183579502, "1": 1.3268145111310318e-05}, "score": 4.04440587161857}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7579146792737669, "2": 0.19771384913391235, "3": 0.034898567376509024, "5": 0.009392821985266822, "1": 7.634030617342044e-05}, "score": 3.5788359594584254}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9587925419283317, "5": 0.025550954625426833, "3": 0.008558499467905708, "2": 0.007095245266825295, "1": 1.8249535925369728e-06}, "score": 4.0027964923743395}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9827936917563943, "5": 0.014239563878174478, "3": 0.0020514036762986957, "2": 0.0009103048632479846, "1": 2.6380224327746028e-06}, "score": 4.010359661248512}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7200273367388093, "5": 0.27329157867669757, "2": 0.0043488623361783605, "3": 0.0023277782664952625, "1": 2.5604155203688304e-06}, "score": 4.262258888473289}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9241403453199457, "4": 0.0758580612496189, "3": 1.2473153952878455e-06, "2": 2.9167023647177694e-07, "1": 0}, "score": 4.92413856497862}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8623950402030158, "5": 0.13645071388476937, "3": 0.0006832384075022472, "2": 0.00046958243233451185, "1": 4.487535438573283e-07}, "score": 4.1348270959862}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6721708363558347, "5": 0.32758988616237883, "3": 0.00021516228513165917, "2": 2.3397813035257743e-05, "1": 2.0885658848669369e-07}, "score": 4.327327468136276}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7771209095298921, "5": 0.22264885273524768, "3": 0.00018199451658412665, "2": 4.7476106240488084e-05, "1": 0}, "score": 4.222372076590479}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8619587959353183, "5": 0.13638168728874522, "3": 0.0015150639949830847, "2": 0.00014314205917729947, "1": 4.774540079948155e-07}, "score": 4.134579018953741}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6370047924301809, "5": 0.36295442629344454, "3": 3.891608097848541e-05, "2": 1.7098532668348615e-06, "1": 0}, "score": 4.362912146881477}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9953528625134586, "5": 0.0041969059657184175, "3": 0.00034450302042062896, "2": 0.00010343853359330388, "1": 8.148327169902283e-07}, "score": 4.003643086754001}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9013690948820597, "5": 0.09801934714003628, "3": 0.0005738081792427751, "2": 3.725996992339856e-05, "1": 1.26238735062456e-07}, "score": 4.097370675707746}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9166793048276148, "5": 0.08264115318071694, "3": 0.0006211906613778633, "2": 5.7779703180637386e-05, "1": 1.6484701087271687e-07}, "score": 4.0819039418888385}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6366866243208944, "5": 0.36277306699664674, "3": 0.0005204313869604958, "2": 1.8956702405963267e-05, "1": 0}, "score": 4.362215055657554}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8478279270458772, "5": 0.1520071682056691, "3": 0.00014987604082802636, "2": 1.4160176572034493e-05, "1": 0}, "score": 4.151829103679988}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7976807693320997, "5": 0.2016852832991473, "3": 0.0005754135259986401, "2": 5.787083578648073e-05, "1": 0}, "score": 4.200994261362172}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.975539035334449, "3": 0.01435703805811122, "5": 0.0076847687002861206, "2": 0.002418119758742706, "1": 4.997589273967965e-07}, "score": 3.9884899856510363}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9737242619826608, "5": 0.02594887559451849, "3": 0.00024274404075310942, "2": 8.389009572744286e-05, "1": 5.5967089861953e-08}, "score": 4.025538187861763}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7876832869736374, "5": 0.21200209972414455, "3": 0.0002443805295905817, "2": 7.00161939869353e-05, "1": 0}, "score": 4.211617732638461}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6369833002510594, "5": 0.36294212234694634, "3": 6.415958901840619e-05, "2": 9.839191646701918e-06, "1": 0}, "score": 4.3628584943323}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8745239743294044, "3": 0.09510006746689229, "2": 0.029924563922255017, "5": 0.0004473359856256013, "1": 2.31101207887063e-06}, "score": 3.8454909376668134}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt4", "target_model": "human", "scores": {"4": 0.718525344430197, "5": 0.28137859592660835, "3": 8.330066713500157e-05, "2": 1.2189580847609073e-05, "1": 0}, "score": 4.281271076252183}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9524499474223136, "5": 0.04741969169251635, "3": 0.00011571937255123665, "2": 1.448397778244281e-05, "1": 0}, "score": 4.047275011811862}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9074220970490628, "5": 0.04310904254715001, "2": 0.03630145339801651, "3": 0.013147515152512668, "1": 1.79975845633053e-05}, "score": 3.9573045469682544}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8557837014437076, "5": 0.1441374962358352, "3": 6.92620791464541e-05, "2": 9.228278852712853e-06, "1": 0}, "score": 4.14404982253712}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9215389230212937, "5": 0.07804573328084283, "3": 0.00035582009712380235, "2": 5.900077373452815e-05, "1": 1.1569192473962134e-07}, "score": 4.077571596142594}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9669920450351116, "5": 0.031083908664000924, "3": 0.0011681721695530039, "2": 0.0007542286398859706, "1": 6.069526836976307e-07}, "score": 4.0284054878568245}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9917073671584646, "5": 0.008060118663930124, "3": 0.00017259245397471966, "2": 5.9646356058230207e-05, "1": 0}, "score": 4.007768235636958}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6986605688768508, "5": 0.3004901813249793, "3": 0.0006272188720596076, "2": 0.00022017453174832596, "1": 5.719495778866021e-07}, "score": 4.299421282130794}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9754507813346572, "5": 0.02441993187561073, "3": 0.00010458807694206852, "2": 2.4456708583142093e-05, "1": 0}, "score": 4.024266436254082}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9494382168391179, "5": 0.05031837300910961, "3": 0.00019318061068411652, "2": 4.9612883995046684e-05, "1": 0}, "score": 4.050025997479321}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8092698075876587, "3": 0.17501685419681823, "4": 0.015533633541490618, "1": 0.00015712042632340603, "5": 2.06097148226789e-05}, "score": 2.2059892367304665}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9569480502144999, "3": 0.020173589107203155, "2": 0.019249773202616657, "5": 0.003616924137881608, "1": 5.270522785744534e-06}, "score": 3.944927624989582}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7422059230435899, "5": 0.2564994906867474, "3": 0.0007317997843965066, "2": 0.0005610903576956936, "1": 0}, "score": 4.254645942098962}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7057221317873417, "5": 0.2941887826075705, "3": 6.677652241845952e-05, "2": 2.1679162764763043e-05, "1": 0}, "score": 4.294078833005733}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9431453646087201, "5": 0.05664027921304374, "3": 0.0001774786922351971, "2": 3.6624798219771314e-05, "1": 0}, "score": 4.056389565173323}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6925059007626856, "5": 0.30729760609490747, "3": 0.00017263811071663394, "2": 2.3364027611269355e-05, "1": 1.0486793923037517e-07}, "score": 4.307078043899082}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8511234383394144, "2": 0.08694773395444018, "3": 0.06165517569601564, "5": 0.0002330347439150384, "1": 3.463752243731995e-05}, "score": 3.7645770708029107}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9340484952425209, "5": 0.05971172972960506, "3": 0.004462808511662215, "2": 0.0017751825788867059, "1": 9.080403690747312e-07}, "score": 4.051695877219323}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7879245519220827, "4": 0.21206702470658764, "3": 7.736176381366264e-06, "2": 5.692318594315118e-07, "1": 0}, "score": 4.78791577022696}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7444569146925887, "3": 0.13771068225050764, "2": 0.11779020036230842, "1": 2.8461023590917855e-05, "5": 0}, "score": 3.6266184030670385}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9574126492750786, "3": 0.029829104530427822, "2": 0.01243461702936982, "5": 0.0003211760958659365, "1": 1.558719355201677e-06}, "score": 3.9456181127121974}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7533407200920977, "3": 0.14377758817203823, "2": 0.10195357666873046, "5": 0.0005105037881076067, "1": 0.0003975807499391226}, "score": 3.6516260419140902}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9139768372740817, "5": 0.08501309292008095, "3": 0.000758854878327085, "2": 0.00025024377880450877, "1": 3.4795245154448573e-07}, "score": 4.083752758821196}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.953673731074162, "5": 0.04460391694203321, "3": 0.0015995083151418483, "2": 0.00012142861484357073, "1": 4.6618466709487245e-07}, "score": 4.042760193417031}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9894142649638641, "5": 0.007321851835587239, "3": 0.0030048819388591415, "2": 0.0002584929854432555, "1": 3.0266416877297756e-07}, "score": 4.003799076714471}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9583522073372017, "5": 0.039555924431276854, "3": 0.00179313463131023, "2": 0.00029733086965511274, "1": 5.922038026935852e-07}, "score": 4.037166381573595}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8108180521799598, "5": 0.18666091442056096, "3": 0.0012976353920076647, "2": 0.0012190156380210856, "1": 2.7085774150428757e-06}, "score": 4.182917428186}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9728483004955284, "5": 0.02435478352699107, "3": 0.0021956496678628918, "2": 0.0006002572167668457, "1": 3.5340469214444125e-07}, "score": 4.020957572953151}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7371449871658067, "4": 0.2628371342586099, "3": 1.5084452203500348e-05, "2": 1.8587692180353901e-06, "1": 0}, "score": 4.737126874649857}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9414503568469929, "5": 0.05833321046752213, "3": 0.00015634303852433154, "2": 5.934112409429573e-05, "1": 0}, "score": 4.05805822863872}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9336063746517038, "3": 0.05104997112467132, "2": 0.012125430956331423, "5": 0.003212919351012156, "1": 4.262835537404945e-06}, "score": 3.927899222744334}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9230252485297086, "3": 0.04891855043201884, "2": 0.027440819813101338, "5": 0.0006062466751598693, "1": 6.52758183168852e-06}, "score": 3.8967862047963635}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.958432903990341, "3": 0.03331222940552947, "2": 0.007092582920897118, "5": 0.0011578323335440432, "1": 3.2016924415057343e-06}, "score": 3.95365077408825}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8558176596147066, "5": 0.14414320419370294, "3": 3.7074802388562485e-05, "2": 1.7890550187460357e-06, "1": 0}, "score": 4.144102590525337}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9414482442347624, "5": 0.05833308213460026, "3": 0.0002071202532087027, "2": 1.1325417748394988e-05, "1": 0}, "score": 4.0581033242911095}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9717293614636666, "5": 0.022149773683331677, "3": 0.0036727925259670766, "2": 0.002446607274612492, "1": 1.1941773735081439e-06}, "score": 4.013580187754553}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7548535515537457, "5": 0.24506507290743818, "3": 7.031805248555141e-05, "2": 1.0616438035116063e-05, "1": 0}, "score": 4.2449736300240835}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.901909980309687, "5": 0.09213591086910765, "3": 0.0052798082405559965, "2": 0.0006712522904036879, "1": 1.3162273258123382e-06}, "score": 4.085509797474116}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6513087557646702, "5": 0.34862044455890995, "3": 6.259838993983026e-05, "2": 7.835107200427902e-06, "1": 0}, "score": 4.348542303583539}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9645802947228491, "5": 0.03513483466695379, "3": 0.00026825782669781957, "2": 1.636383239908681e-05, "1": 0}, "score": 4.034833857847385}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt4", "target_model": "human", "scores": {"4": 0.964407739992146, "2": 0.02065101103997556, "3": 0.011053689669618751, "5": 0.0038802100120296193, "1": 5.566511510296187e-06}, "score": 3.951507712277104}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9021770158526479, "5": 0.07883134358290048, "2": 0.009713929428615433, "3": 0.009269096213539114, "1": 6.898586654660722e-06}, "score": 4.0501137787642305}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9281073258756241, "5": 0.05750647090686543, "3": 0.0084150542881959, "2": 0.005967167021306053, "1": 2.822936225460497e-06}, "score": 4.037148656821627}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.927848225202599, "5": 0.06721310739177912, "2": 0.0027742154291309556, "3": 0.0021605611486159616, "1": 1.939632569484276e-06}, "score": 4.059498412580216}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9953859281870844, "5": 0.002795833516047888, "2": 0.0009512344460371086, "3": 0.0008661088192183843, "1": 3.292333720842436e-07}, "score": 4.000026268119502}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9868426240955515, "5": 0.006754005112906646, "2": 0.0036720888863299313, "3": 0.00272886474662324, "1": 1.3742258549222161e-06}, "score": 3.996676836450222}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9344971704191364, "5": 0.04800276814737991, "2": 0.009019452907658727, "3": 0.008472991880885595, "1": 6.208309011407943e-06}, "score": 4.02147227576432}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9836281369100371, "3": 0.007628363034647529, "2": 0.00508158529565712, "5": 0.0036601285838006982, "1": 1.6522344071225684e-06}, "score": 3.9858636363611724}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8476379077132421, "5": 0.15197310721595064, "2": 0.000201635085841001, "3": 0.00018648196984279736, "1": 0}, "score": 4.151383486477581}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9799904110580815, "5": 0.01851891938515857, "2": 0.0008661411256798528, "3": 0.0006238580496553866, "1": 2.52441322847221e-07}, "score": 4.016162028514935}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8841099555263238, "2": 0.0797049170985958, "3": 0.03220369762339152, "5": 0.003968275347325144, "1": 1.1146065414025441e-05}, "score": 3.81232092840731}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8590990887858675, "5": 0.14024407240001835, "2": 0.0003586652699893407, "3": 0.00029734395250119835, "1": 0}, "score": 4.139229513411177}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9664074043934187, "5": 0.03205123060310016, "3": 0.0010143120292456826, "2": 0.000526218148613188, "1": 2.450827324339538e-07}, "score": 4.029983764711142}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8354748108456749, "5": 0.16451474130423413, "3": 8.332225255044973e-06, "2": 1.918187170454845e-06, "1": 0}, "score": 4.164502605183648}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9193075917141017, "5": 0.08032819490849745, "3": 0.0002364534968552064, "2": 0.00012656443650502835, "1": 0}, "score": 4.07983870798134}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9772926083536321, "3": 0.011923796139097793, "5": 0.006185983945614168, "2": 0.004597032924558442, "1": 3.8991229801341404e-07}, "score": 3.9850669494022686}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.4570519127044617, "2": 0.4429899036741451, "3": 0.09884440815094947, "5": 0.0010477780498574015, "1": 6.29239942741689e-05}, "score": 3.0160317664139353}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt4", "target_model": "gpt35", "scores": {"2": 0.5736175465184122, "4": 0.2709577701364367, "3": 0.15438708365113105, "5": 0.0009471602125957333, "1": 8.809956170554086e-05}, "score": 2.6990576407388445}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8749899223544915, "5": 0.12217595734578239, "2": 0.001537968329674257, "3": 0.0012950991798584112, "1": 6.624683856488367e-07}, "score": 4.117802980082491}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9160751739906428, "5": 0.08258669408423046, "3": 0.00115977182012729, "2": 0.0001778567690233029, "1": 1.7536312725551468e-07}, "score": 4.081070709225667}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9382514176658652, "5": 0.026616142136898356, "2": 0.023488662994564133, "3": 0.011627731353111265, "1": 1.361467912326313e-05}, "score": 3.967970162887296}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9710027486046688, "5": 0.025876346243907607, "3": 0.0021914847430611153, "2": 0.0009279330241822652, "1": 6.00021109409489e-07}, "score": 4.021827214757819}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5763735524102226, "5": 0.42168389905481524, "3": 0.0014972517769668537, "2": 0.000442586779889167, "1": 1.3653155279943159e-06}, "score": 4.419297941585738}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.49997607085259504, "5": 0.49997607085259504, "3": 3.515671217151181e-05, "2": 1.2149834617484847e-05, "1": 0}, "score": 4.499916890299343}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8581728267498918, "5": 0.14009285867406232, "3": 0.000973901878652108, "2": 0.0007584755457289739, "1": 9.453609733579533e-07}, "score": 4.137599306090743}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6224064270089983, "5": 0.3775085732329792, "3": 7.802065177288972e-05, "2": 6.817368575047102e-06, "1": 0}, "score": 4.377416978886601}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5231601016820077, "4": 0.47634269324210016, "3": 0.00034902475745896884, "2": 0.00014778633644034695, "1": 0}, "score": 4.522515710113448}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8278543879713769, "5": 0.16301419436058665, "3": 0.007866295806275694, "2": 0.0012642287835398142, "1": 3.801621365858688e-07}, "score": 4.152618378781244}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9196322105593262, "4": 0.08035656380235309, "3": 1.0072959516731922e-05, "2": 8.140199195920354e-07, "1": 0}, "score": 4.919620820997732}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.798179060589201, "4": 0.20181125491428475, "3": 8.473668721885024e-06, "2": 1.2594984144841413e-06, "1": 0}, "score": 4.798168029076315}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt4", "target_model": "human", "scores": {"2": 0.49773767389045287, "4": 0.3529488617877298, "3": 0.14713097536806377, "5": 0.002002603890435917, "1": 0.00017498557780145076}, "score": 2.8588657330372493}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8618205574503699, "5": 0.13635981342043524, "3": 0.0010910843071523975, "2": 0.0007268188399484113, "1": 8.780318222039848e-07}, "score": 4.1338125708043245}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6583542754571438, "4": 0.34154969185519035, "3": 8.648738437834143e-05, "2": 8.974377368317868e-06, "1": 0}, "score": 4.6582502151301375}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9196400780465407, "4": 0.08035724683604832, "3": 1.80599657396613e-06, "2": 5.094047244018047e-07, "1": 0}, "score": 4.919637584048974}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.8840346767686493, "4": 0.11596011305278511, "3": 4.230209664748718e-06, "2": 5.378108061840087e-07, "1": 0}, "score": 4.8840297618182875}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6508493153515033, "5": 0.3483745447368886, "3": 0.0006518298476227171, "2": 0.00012247519968825712, "1": 0}, "score": 4.347478402065604}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9615317953628014, "4": 0.038466109426269206, "3": 1.1100533286114473e-06, "2": 6.035255264225595e-07, "1": 0}, "score": 4.96152984520905}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.766152402617952, "4": 0.2336632973614835, "3": 0.000151091491599953, "2": 3.16704971409946e-05, "1": 0}, "score": 4.765939148170854}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9755752265528886, "4": 0.024423048057726247, "2": 6.938722300121808e-07, "3": 4.410520240896679e-07, "1": 0}, "score": 4.975573973798819}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7979918856040535, "5": 0.20176393572339935, "3": 0.00017832434551281687, "2": 6.45847979965388e-05, "1": 0}, "score": 4.2014566975370204}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt4", "target_model": "human", "scores": {"5": 0.6981328812883844, "4": 0.3002632167020031, "3": 0.001368936661498467, "2": 0.00023419768302417523, "1": 4.052668896849339e-07}, "score": 4.696294585796074}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5156050312066062, "5": 0.4843661015678357, "3": 2.4531807920111562e-05, "2": 4.004707555340687e-06, "1": 0}, "score": 4.484333720518849}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5539698810768654, "5": 0.44512730458910577, "3": 0.0007947205615535095, "2": 0.0001075537322918041, "1": 0}, "score": 4.4441177164043815}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7930187287775614, "4": 0.20687130376653193, "3": 9.338461013699476e-05, "2": 1.5976223056084878e-05, "1": 0}, "score": 4.7928938727087464}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9823917867668212, "3": 0.007384367597824994, "5": 0.007046212785811492, "2": 0.0031759769283406605, "1": 0}, "score": 3.993309880252993}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt4", "target_model": "human", "scores": {"4": 0.930713707255531, "2": 0.04353005760842065, "3": 0.024802679184825725, "5": 0.0009467943952677738, "1": 4.249632709740539e-06}, "score": 3.8890709724502686}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8262040682349046, "5": 0.17318179466714165, "3": 0.0005686964761475368, "2": 4.454378143436755e-05, "1": 2.8194946054366943e-07}, "score": 4.172523270862736}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8345009645826238, "5": 0.16432299604131942, "3": 0.0010081164401324557, "2": 0.00016716202605576111, "1": 0}, "score": 4.162980679562683}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8805643590178993, "5": 0.11917142216889674, "3": 0.00022648824790872136, "2": 3.697319009465839e-05, "1": 0}, "score": 4.118871077570805}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9573675217360166, "5": 0.04206379014300083, "3": 0.00046004189340887716, "2": 0.00010757546034018603, "1": 0}, "score": 4.041388641646512}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9565159603895579, "5": 0.04336043021358261, "3": 0.0001091724298971046, "2": 1.4320306400180942e-05, "1": 0}, "score": 4.0432226222132615}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9040856332769632, "5": 0.09528991477476234, "3": 0.000524032946824786, "2": 0.00010001343810045017, "1": 0}, "score": 4.094565893304197}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9883626430087963, "5": 0.004039213032174942, "3": 0.003976590838482043, "2": 0.0036207271614068174, "1": 2.7962120191748155e-07}, "score": 3.9928203250847445}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5850973999313447, "5": 0.4148961836193636, "3": 5.744733706253969e-06, "2": 4.161471139075124e-07, "1": 0}, "score": 4.414889712624159}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9187529110227263, "2": 0.04433468283520211, "3": 0.036754743015675335, "5": 0.00015257366948065806, "1": 3.0691405091769603e-06}, "score": 3.8747190044546227}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8518939940693854, "2": 0.08175379894575663, "3": 0.06366992263801745, "5": 0.0026693560911982507, "1": 1.1981233587525356e-05}, "score": 3.7754556792124814}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8799076501747708, "5": 0.11908255344011599, "3": 0.0009380678282549157, "2": 7.121457894809235e-05, "1": 0}, "score": 4.118002117104447}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8123804045600762, "5": 0.18702058275052183, "3": 0.0005505121121249911, "2": 4.810319302498477e-05, "1": 0}, "score": 4.186373938314416}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7606278259099372, "4": 0.2393421645616797, "3": 2.647695039181173e-05, "2": 3.212018507211101e-06, "1": 0}, "score": 4.760595168738527}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8721013803166672, "3": 0.08369302820481152, "2": 0.043419371045534415, "5": 0.00078292441437373, "1": 2.268880545210492e-06}, "score": 3.8302441731141856}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5599300577098005, "5": 0.4360739674096096, "3": 0.0034892491820344793, "2": 0.0005026740046806399, "1": 2.291751925310358e-06}, "score": 4.431573254506312}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5386608644871946, "5": 0.46074105344249866, "3": 0.00048357990162620565, "2": 0.00011307949398383732, "1": 0}, "score": 4.460031969028746}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7171410322688091, "5": 0.2808364521238152, "3": 0.001618536391730948, "2": 0.00040288556264619056, "1": 4.5721733050622973e-07}, "score": 4.278410950145458}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5543969846856123, "5": 0.44547049198003796, "3": 0.00010111531092816898, "2": 3.083842748595261e-05, "1": 0}, "score": 4.4453079534597375}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5466209928429511, "5": 0.4531647196754866, "3": 0.00017226096372905121, "2": 4.155989160057516e-05, "1": 0}, "score": 4.452909550268034}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9855385647387573, "5": 0.01044698352641831, "3": 0.0027252584808707555, "2": 0.0012873209539371335, "1": 0}, "score": 4.005147092774576}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7979319985603284, "5": 0.2017488241705484, "3": 0.00026352640138303763, "2": 5.52381345448355e-05, "1": 1.6515903149279422e-07}, "score": 4.201374375878073}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6788439711163711, "5": 0.32066320893168504, "3": 0.00038737629455377133, "2": 0.00010426091526338839, "1": 3.701938683567366e-07}, "score": 4.320066460294445}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7431619056461386, "4": 0.2568298694172938, "3": 5.682655027645682e-06, "2": 2.2253596832892498e-06, "1": 0}, "score": 4.743152007792858}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.977910574739111, "2": 0.013519975777147848, "3": 0.00846058465158053, "5": 8.692525035047558e-05, "1": 1.7386143840317494e-05}, "score": 3.9645340691210373}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7876354918019041, "5": 0.21198923158724323, "3": 0.00029019135725131867, "2": 8.445049949877591e-05, "1": 0}, "score": 4.211530273500704}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9966827221646154, "3": 0.0016979687419635971, "5": 0.0009524741408936825, "2": 0.0006649341132742704, "1": 9.391195965317315e-07}, "score": 3.9979218178149636}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8620301087363194, "5": 0.13639298015997114, "3": 0.0010913498002602547, "2": 0.00048428353822301185, "1": 4.020899568910875e-07}, "score": 4.134331974644582}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8174960238619402, "5": 0.1824080260213402, "3": 7.497288823359774e-05, "2": 2.08192191559095e-05, "1": 0}, "score": 4.182291443498544}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9316708890464437, "5": 0.06749000946390887, "2": 0.0004619053767910456, "3": 0.00037699618120397256, "1": 0}, "score": 4.066189215762442}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8021144624820693, "5": 0.19656661450648757, "3": 0.0010980120076781457, "2": 0.00021961621769184345, "1": 5.113922135285589e-07}, "score": 4.195027988670514}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.585092455879204, "4": 0.4148926777614243, "3": 1.3567138173287386e-05, "2": 9.52562609830789e-07, "1": 0}, "score": 4.585077186437843}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8516755197982772, "5": 0.1479990239754856, "3": 0.0002601375573823702, "2": 6.475335785271854e-05, "1": 0}, "score": 4.147609463147651}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6992378869272908, "4": 0.3007384887516031, "3": 2.0496344598248457e-05, "2": 3.0944851952263822e-06, "1": 0}, "score": 4.699211225029804}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.651313399612654, "4": 0.34862295463514703, "3": 5.1091674482856044e-05, "2": 1.2135336372126484e-05, "1": 0}, "score": 4.651238309965832}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8803319559236027, "2": 0.10190582260532396, "3": 0.01336713762724428, "5": 0.004339674212203493, "1": 5.2126765912599214e-05}, "score": 3.7870038118386904}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9895470874074921, "2": 0.004727976354755919, "3": 0.003919630068161083, "5": 0.0017667156872095875, "1": 2.855629944903992e-05}, "score": 3.988305346664898}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6442237792040492, "4": 0.3557741356145264, "3": 1.4335825026256077e-06, "2": 5.52695289969915e-07, "1": 0}, "score": 4.644221303946792}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6992493475301769, "4": 0.3007433908289216, "3": 6.349572945489847e-06, "2": 7.236210450725555e-07, "1": 0}, "score": 4.699241682485076}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7981838416960932, "4": 0.20181248596669446, "3": 2.883037880873856e-06, "2": 7.176448702051972e-07, "1": 0}, "score": 4.7981795805616}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6785404124648096, "5": 0.3205198083522604, "3": 0.000546043999664547, "2": 0.0003933007388251704, "1": 3.0676403516284134e-07}, "score": 4.319186283336674}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9453001971430903, "2": 0.03443255830022136, "3": 0.01551996530084283, "5": 0.004733321987750614, "1": 1.137175964594408e-05}, "score": 3.920313918778491}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9517261653562631, "5": 0.036902432821020244, "2": 0.006215382570005202, "3": 0.005152733131165243, "1": 2.362646899096104e-06}, "score": 4.019311864443164}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8262949887329272, "5": 0.1732008457123433, "3": 0.0003970578777975335, "2": 0.000106866624610039, "1": 8.078867840394253e-08}, "score": 4.172589839879167}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5466937529391754, "5": 0.45322503991389823, "3": 6.960897832647102e-05, "2": 1.1542300115240355e-05, "1": 0}, "score": 4.45313237165116}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7781626772025735, "2": 0.16311175493540825, "3": 0.04600778305303953, "5": 0.012382826821850013, "1": 0.0003299910582773824}, "score": 3.639159768455405}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9048867873122692, "2": 0.05968374939958337, "3": 0.03508626625024912, "1": 0.0002763907313773654, "5": 6.463076643164488e-05}, "score": 3.844781355838501}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt4", "target_model": "gpt35", "scores": {"2": 0.9095198919138192, "3": 0.07236095649372856, "4": 0.015895589470954985, "1": 0.002219521604030507, "5": 2.944819597360546e-06}, "score": 2.10194155998755}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9243678412213148, "5": 0.07354225058707399, "3": 0.0017027341437982346, "2": 0.00038591439025574905, "1": 4.448538658770169e-07}, "score": 4.071066411006341}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5128385503560091, "2": 0.2922065978527586, "3": 0.19465155816501864, "5": 0.00016674514317158645, "1": 0.00012986124807538505}, "score": 3.2207071962143226}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6512471123082596, "5": 0.34858746662473555, "3": 0.0001478235832900361, "2": 1.7111821799711397e-05, "1": 0}, "score": 4.3484055886051705}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8518009297342651, "5": 0.14802081103530307, "3": 0.00016537796611473332, "2": 1.2752579411969087e-05, "1": 0}, "score": 4.147829946933847}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9390969565429522, "5": 0.06003445689579644, "3": 0.0007919901524519016, "2": 7.60049567051543e-05, "1": 0}, "score": 4.05909049177913}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5850811051956619, "4": 0.4148846289215497, "3": 3.0099409630693993e-05, "2": 3.767382856855613e-06, "1": 0}, "score": 4.585043704505585}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8394542673546949, "5": 0.16021264738374325, "3": 0.00027723972301367154, "2": 5.5451433077628204e-05, "1": 0}, "score": 4.159824567782311}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt4", "target_model": "human", "scores": {"4": 0.948959501693378, "2": 0.03456584925813529, "3": 0.01374934626999737, "5": 0.002707406806987719, "1": 1.635234901988033e-05}, "score": 3.9197771811399136}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9326484018977277, "2": 0.057787834571396135, "3": 0.007232995595936085, "5": 0.0023118042470211754, "1": 1.5576814488689365e-05}, "score": 3.8794560007975587}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9913333795593529, "5": 0.0039885441075221935, "2": 0.002575197625614356, "3": 0.002101815045858046, "1": 3.893823777155967e-07}, "score": 3.9967351634618913}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9601658586654496, "5": 0.03963077960030126, "3": 0.0001301400994136503, "2": 7.300197955439893e-05, "1": 0}, "score": 4.039354644186234}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9742304438454413, "5": 0.02438938456890227, "3": 0.0007963416146908624, "2": 0.0005826159712884395, "1": 0}, "score": 4.022427838239023}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9447820320579774, "2": 0.036633176038954274, "3": 0.017853584117784305, "5": 0.0007254807640868579, "1": 4.450803127412981e-06}, "score": 3.9095920767787873}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8738352781718722, "5": 0.12588790636649713, "3": 0.0002355437233399606, "2": 4.093136165978561e-05, "1": 0}, "score": 4.125570542661116}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8437709900571982, "5": 0.15608193269867524, "3": 0.00011616499578751132, "2": 3.0303449713466564e-05, "1": 0}, "score": 4.155905255718366}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.679136323899667, "5": 0.32080131624182096, "3": 5.0046499235199155e-05, "2": 1.2074279849465234e-05, "1": 0}, "score": 4.320727197862162}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9796519827796727, "5": 0.019706477306419435, "3": 0.0004353727488027767, "2": 0.00020565552450934753, "1": 0}, "score": 4.018859803158039}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8248909938861995, "3": 0.10164651741963482, "2": 0.0606959077995905, "5": 0.012722553428267308, "1": 4.1778487668074e-05}, "score": 3.78955841166781}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9656652644046704, "3": 0.021003566969333705, "5": 0.007848459566586523, "2": 0.005479107808197913, "1": 2.632864871193724e-06}, "score": 3.975878755027559}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9484510298364894, "5": 0.034547330382093885, "3": 0.014858621645760173, "2": 0.0021405874034922685, "1": 1.5441298656836373e-06}, "score": 4.015402915196012}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8870877256863763, "5": 0.11278055945820536, "3": 0.0001240518418865468, "2": 7.108736765833016e-06, "1": 0}, "score": 4.112642352577826}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9750376113351062, "5": 0.016516357921425404, "3": 0.006673211838152222, "2": 0.0017682251068369074, "1": 3.413477471274994e-06}, "score": 4.006296462869034}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9672625447349638, "5": 0.03109260093998693, "2": 0.0009243590310968927, "3": 0.0007198915372573851, "1": 0}, "score": 4.028524008562097}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.577383406774788, "4": 0.4224227242908913, "3": 0.0001556346942991671, "2": 3.6393367917161894e-05, "1": 0}, "score": 4.577156047815123}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9504950793252344, "3": 0.02003755131703427, "2": 0.017683080509278366, "5": 0.01177947109881116, "1": 2.9828003020883706e-06}, "score": 3.9563667302974745}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6859167255165999, "5": 0.31403557604042087, "3": 3.212908060795132e-05, "2": 1.4941410077737766e-05, "1": 0}, "score": 4.313973761300201}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.988514508688168, "5": 0.007090127184666879, "3": 0.00219641893867146, "2": 0.00219641893867146, "1": 0}, "score": 4.000500871633979}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9402013824636754, "3": 0.03319316824458314, "2": 0.025850865421502237, "5": 0.0007448809135094742, "1": 8.274881144555568e-06}, "score": 3.9158250369742786}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.4958402900380727, "2": 0.32013855260666024, "3": 0.18240944880949206, "1": 0.0014369227947731676, "5": 0.00014227453810141777}, "score": 3.173118069196473}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9663951571899874, "5": 0.022727434862356993, "3": 0.00932732047411292, "2": 0.0015466213521811833, "1": 1.304347033345373e-06}, "score": 4.010302980915501}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7430307862962321, "5": 0.256784568623976, "3": 0.00017401083335968795, "2": 9.971615011476957e-06, "1": 0}, "score": 4.256590784585709}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9839697571557658, "5": 0.015415065015119724, "3": 0.0005703359413254512, "2": 4.467216308992385e-05, "1": 0}, "score": 4.014755387251968}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9217618923734381, "2": 0.06471784526319847, "3": 0.013355286233039264, "1": 9.72992769442328e-05, "5": 5.810005194760555e-05}, "score": 3.856973855728695}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.943473342891312, "2": 0.03228388143787375, "3": 0.013249280896300545, "5": 0.010984039657984465, "1": 7.800579750840584e-06}, "score": 3.933143483530119}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5697175541492921, "4": 0.4300453718202024, "3": 0.00017675623111073951, "2": 5.920592124770444e-05, "1": 0}, "score": 4.569423019204697}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5077791093912555, "5": 0.4921563885948039, "3": 4.5135837677904215e-05, "2": 1.881541645429247e-05, "1": 0}, "score": 4.49207389293874}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9593451698557015, "5": 0.03605338940913058, "2": 0.0029135605180474864, "3": 0.0016862394617162726, "1": 1.073454076252527e-06}, "score": 4.028536824738068}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9842453289163812, "5": 0.014944977332132185, "3": 0.0006669769969331164, "2": 0.00014200759725477413, "1": 0}, "score": 4.013993995064633}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8007699152948159, "5": 0.19623711117848383, "3": 0.0022846167339896357, "2": 0.0006545536532750916, "1": 0}, "score": 4.192653752514653}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7821830394758988, "5": 0.21720438551260948, "3": 0.0005300487894971334, "2": 8.12856145395273e-05, "1": 0}, "score": 4.216512034100477}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8558484696050292, "4": 0.14414839344245983, "3": 1.7340740080159782e-06, "2": 9.57646619690833e-07, "1": 0}, "score": 4.8558452012873525}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7879231336591657, "4": 0.21206664298628672, "3": 8.630311141867672e-06, "2": 1.2433142022814984e-06, "1": 0}, "score": 4.787912292275558}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6963177538108546, "2": 0.22606127231889236, "3": 0.07572104135713832, "5": 0.0018373168597642373, "1": 5.906045367990281e-05}, "score": 3.4738146788099207}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5156169676012419, "5": 0.4843773147728793, "3": 4.263091315210452e-06, "2": 8.797386167638103e-07, "1": 0}, "score": 4.484371570619147}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9586275287574559, "5": 0.04082327885940975, "3": 0.0004606474767547699, "2": 8.791606548067408e-05, "1": 0}, "score": 4.040186824522813}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6513409637789793, "5": 0.34863770169802627, "3": 1.9092365783707325e-05, "2": 1.5918765778874817e-06, "1": 0}, "score": 4.348615652277093}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5078046767130652, "4": 0.49218116929281847, "3": 1.1235771335370328e-05, "2": 2.212454555859036e-06, "1": 0}, "score": 4.507789374414224}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9809655404460992, "5": 0.012348533103589361, "2": 0.003885638339142994, "3": 0.0027987203055636297, "1": 7.311899949173425e-07}, "score": 4.001776344035872}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9038815553654775, "5": 0.09526841026787256, "3": 0.0007864888596728621, "2": 6.257266728793197e-05, "1": 0}, "score": 4.09435686786773}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6150147916508834, "5": 0.384866422285422, "3": 0.00010213306868230491, "2": 1.6159798079982108e-05, "1": 0}, "score": 4.3847321593693}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8266078088481486, "5": 0.1732664146405823, "3": 8.325936024905716e-05, "2": 4.186543549488445e-05, "1": 0}, "score": 4.173099537220999}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8740137248152121, "5": 0.12591360271040922, "3": 5.5090459809482796e-05, "2": 1.7066228307913213e-05, "1": 0}, "score": 4.125824444692504}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9526830423475818, "3": 0.03062394376555547, "2": 0.015641181550677046, "5": 0.0010478938357289622, "1": 2.4400964274336893e-06}, "score": 3.9391341754779403}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7662827898659899, "5": 0.23370304686896443, "3": 1.0946902701765175e-05, "2": 2.9463188920737346e-06, "1": 0}, "score": 4.2336862704339255}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6858430140070675, "5": 0.31400181903046837, "3": 0.0001373838122350405, "2": 1.692900728470535e-05, "1": 0}, "score": 4.313830845260067}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9796660604798132, "5": 0.01910044587425867, "3": 0.0008658545669951146, "2": 0.0003666258911442469, "1": 0}, "score": 4.017501357257137}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9415430264832853, "5": 0.05833895073784881, "3": 0.00010746342509101336, "2": 9.995655593669006e-06, "1": 0}, "score": 4.058211528815304}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9834941296565181, "5": 0.011999461562409797, "3": 0.002635931892813055, "2": 0.0018691556016776512, "1": 5.038339940582851e-07}, "score": 4.005623711561377}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8986264707610625, "5": 0.10082309827923923, "3": 0.00043861522932503607, "2": 0.0001108992972963483, "1": 0}, "score": 4.100162776247802}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.679087251281917, "5": 0.3207780910672865, "3": 0.00010760902912026965, "2": 2.6786005223252943e-05, "1": 0}, "score": 4.320616994227017}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8080641662002217, "4": 0.19193206455688572, "3": 3.1069655980987607e-06, "2": 5.484120042006068e-07, "1": 0}, "score": 4.808060054420606}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9473484235197444, "2": 0.03241647816921536, "3": 0.017351297352926426, "5": 0.002877127150135055, "1": 5.730464304882017e-06}, "score": 3.920675607235699}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9611867327631373, "5": 0.03289000390671296, "3": 0.004521273848291075, "2": 0.0014006252989061277, "1": 5.001603949831602e-07}, "score": 4.025566001069026}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7544969071404983, "5": 0.24494928251740644, "3": 0.0004583149254466993, "2": 9.457863056231161e-05, "1": 2.0052458084171182e-07}, "score": 4.244301383740771}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.765481631193898, "5": 0.23345869794062488, "3": 0.0009691172038327582, "2": 9.014194169977037e-05, "1": 0}, "score": 4.232309392499802}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9019088204541982, "4": 0.09807801947037535, "3": 1.0192412367840451e-05, "2": 2.7864504841589007e-06, "1": 0}, "score": 4.901893218575254}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9275376892649942, "2": 0.049157699084864746, "3": 0.023220452857397694, "5": 6.729181152259643e-05, "1": 1.3459209029485352e-05}, "score": 3.8784906490811193}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9548564155638996, "2": 0.021427732172318033, "3": 0.015433821135588204, "5": 0.008261129148541527, "1": 1.9539568392538748e-05}, "score": 3.9499131567242607}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8516251276486372, "5": 0.14799024789357726, "2": 0.00019944261642045714, "3": 0.00018445426710119453, "1": 2.447303120092907e-07}, "score": 4.147406245376914}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7824394654559362, "5": 0.21727559678106978, "3": 0.00020763828635524055, "2": 7.63858567501618e-05, "1": 2.887114761332087e-07}, "score": 4.216914456198453}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5774836781091811, "5": 0.42249608436626857, "3": 1.2978713053818065e-05, "2": 6.839301167797667e-06, "1": 0}, "score": 4.4224696042812415}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8902407297185552, "5": 0.1096991785366702, "3": 4.169985109621777e-05, "2": 1.821731577467696e-05, "1": 0}, "score": 4.10962106319144}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7116466634122469, "5": 0.28753125833826326, "3": 0.0007469228185926349, "2": 7.395535186696389e-05, "1": 3.319441848782192e-07}, "score": 4.286635677821802}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9516265181816365, "3": 0.02135524931443267, "5": 0.020698217366076306, "2": 0.006312600902209338, "1": 5.756346918467864e-06}, "score": 3.986700475157337}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9503145014651978, "2": 0.02454585691704125, "3": 0.01852818486573854, "5": 0.00660642644436521, "1": 3.076902957948466e-06}, "score": 3.938977177833402}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8590217733471237, "5": 0.1402314510014738, "3": 0.0006294205019903065, "2": 0.0001164310855885251, "1": 3.120551193989756e-07}, "score": 4.1393683174575715}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.983482715289887, "3": 0.00750898181220573, "5": 0.004924510500791014, "2": 0.004082562597940895, "1": 5.117625955532678e-07}, "score": 3.989248860485205}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9785588802163238, "5": 0.01737150602220904, "2": 0.0022085391502668157, "3": 0.001859776425176164, "1": 4.2214203656612704e-07}, "score": 4.011093394588691}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7662722152364548, "4": 0.23369982178917076, "3": 2.390989901618576e-05, "2": 3.498791271906894e-06, "1": 0}, "score": 4.766241732470493}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8560207007616787, "5": 0.13974154076186762, "3": 0.0031852930014926546, "2": 0.0010503981460200987, "1": 1.0356720689474627e-06}, "score": 4.134452483160956}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5774770197607579, "5": 0.4224912130144992, "3": 2.581094322390772e-05, "2": 5.582007942355152e-06, "1": 0}, "score": 4.4224543961689085}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9897300468370677, "3": 0.006880437767940561, "2": 0.00273684905566629, "5": 0.0005918851176118897, "1": 4.027824745991506e-05}, "score": 3.988116670852367}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9650793384619085, "5": 0.017132209341110434, "2": 0.009170210845609159, "3": 0.008614615857119054, "1": 2.800969361950896e-06}, "score": 3.990168760778585}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9334914603813961, "5": 0.06554137869503052, "3": 0.0008250444452915737, "2": 0.00014114836313031438, "1": 0}, "score": 4.064434099903107}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6858303603201897, "4": 0.31399601005054956, "3": 0.00015567345216320144, "2": 1.6407861142869914e-05, "1": 0}, "score": 4.6856429327376325}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6442155847296946, "4": 0.3557696528886589, "3": 1.3601275266809749e-05, "2": 9.699978324879352e-07, "1": 0}, "score": 4.644200166570921}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8342465973937219, "5": 0.1642728851698232, "3": 0.0011242925337829755, "2": 0.0003537743420236307, "1": 1.2561287339341955e-06}, "score": 4.16243746958629}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8396217971684767, "5": 0.16024462901982214, "3": 0.00011030029027742331, "2": 2.1382686616400797e-05, "1": 0}, "score": 4.160091866063584}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9361468067359873, "5": 0.06370558778000243, "3": 0.00012688454239517184, "2": 2.0392201696035745e-05, "1": 0}, "score": 4.063537939721672}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9812974150332007, "5": 0.012744824644714816, "3": 0.004336208197365259, "2": 0.001620322622296088, "1": 0}, "score": 4.005167977556798}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7548445311077019, "5": 0.24506215665042239, "3": 8.88893695686389e-05, "2": 4.029501044373381e-06, "1": 0}, "score": 4.244965304641076}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5077762049030566, "5": 0.4921535734683124, "3": 5.8867935755173676e-05, "2": 1.0720647532443783e-05, "1": 0}, "score": 4.492073575742378}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9609167579528137, "5": 0.0384415105248667, "2": 0.0004011731613705861, "3": 0.00023955153183974646, "1": 0}, "score": 4.0373996503253435}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9687036496323642, "5": 0.031138929194036744, "3": 0.00011586950001684971, "2": 4.067401994195421e-05, "1": 0}, "score": 4.030941738810266}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9830156217979051, "5": 0.010751011885011793, "3": 0.003833391340849554, "2": 0.0023988750036603537, "1": 5.035891902293215e-07}, "score": 4.002118361032626}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7662843990615382, "5": 0.23370351427552558, "3": 8.659730118682192e-06, "2": 2.9463247847174125e-06, "1": 0}, "score": 4.233689074208684}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9550697027424225, "5": 0.04466920236254243, "3": 0.00022366839106742432, "2": 3.708785501613092e-05, "1": 0}, "score": 4.0443713732877615}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8925359785857134, "2": 0.0755894542178343, "3": 0.031021849505805114, "5": 0.0008012692700773961, "1": 4.663948770541737e-05}, "score": 3.818459719850467}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9116127457253328, "5": 0.08748481880874032, "3": 0.0008443740283358684, "2": 5.7460373744794e-05, "1": 0}, "score": 4.08652557604031}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9472393104230917, "5": 0.05020184499858332, "3": 0.0023849467069162, "2": 0.00017276487360618915, "1": 0}, "score": 4.047471422329472}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6791616357821427, "4": 0.32081325027275676, "3": 2.3274644705208437e-05, "2": 1.6598704513444043e-06, "1": 0}, "score": 4.67913516325372}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9943185090629039, "5": 0.0040635524510660315, "3": 0.0012011838101614498, "2": 0.0004151180169369731, "1": 8.939893272886771e-07}, "score": 4.002029452146261}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9876354707957469, "5": 0.009989791074538241, "3": 0.0016825553491797618, "2": 0.0006905193239922482, "1": 7.135117015170148e-07}, "score": 4.006924063119747}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8594403477499921, "5": 0.14029977438006458, "3": 0.0001920559158403646, "2": 6.637274849213169e-05, "1": 0}, "score": 4.13997517582005}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.940277788212817, "5": 0.05826055507193063, "3": 0.0008709249936781295, "2": 0.0005892973281908122, "1": 4.250942193516707e-07}, "score": 4.056209816871734}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5467075571307143, "5": 0.45323648399063693, "3": 4.710101534290743e-05, "2": 8.184929176656944e-06, "1": 0}, "score": 4.453173318072734}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.953245991825212, "5": 0.0459991528024816, "3": 0.0005439615466020621, "2": 0.00020971585812541574, "1": 0}, "score": 4.045035812590356}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9831236798307442, "3": 0.014468665035345616, "5": 0.00132493086269956, "2": 0.0010813770540345484, "1": 0}, "score": 3.9846934910980933}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9462952263713615, "5": 0.053386327773631344, "3": 0.00027580236985066053, "2": 4.2295663284200744e-05, "1": 0}, "score": 4.053025952520798}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9448538552283826, "5": 0.04488731683378495, "3": 0.007102204856318203, "2": 0.0031515843006359847, "1": 3.0592217634994887e-06}, "score": 4.031472828013229}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.943205489212639, "5": 0.0566438873137464, "3": 0.00011281954078432322, "2": 3.720393584488441e-05, "1": 0}, "score": 4.056456693775119}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.87977983527449, "5": 0.11906524009555644, "3": 0.0009984228240334336, "2": 0.00015552438840896773, "1": 0}, "score": 4.117755883591368}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5929866457811253, "2": 0.34859883076138193, "3": 0.05690719476849251, "5": 0.0012770423995706957, "1": 0.00022896120024721442}, "score": 3.2464843040320748}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.8812474222203194, "4": 0.062847633361558, "3": 0.05546284177634723, "1": 0.0003737058004194142, "5": 6.294230782099456e-05}, "score": 2.1809742167524413}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.958425890204013, "5": 0.021174386747932507, "3": 0.018686330719178742, "2": 0.0017111527718672761, "1": 1.3987060482172817e-06}, "score": 3.9990615535777807}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7182160858421072, "5": 0.28125746038555605, "3": 0.000502151043531516, "2": 2.3485907442358624e-05, "1": 0}, "score": 4.280708566815894}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9262029915710779, "3": 0.04133536706790021, "2": 0.029311164341167276, "5": 0.003138023926309743, "1": 9.530274852004878e-06}, "score": 3.9031514542807786}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9375789043867678, "5": 0.06184003553964191, "3": 0.0003677141823363985, "2": 0.000212816769406426, "1": 2.0337708895816953e-07}, "score": 4.061046097572672}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7307633326486405, "5": 0.26883281450834695, "3": 0.0003403485222274396, "2": 6.295817128127748e-05, "1": 1.8532310902814963e-07}, "score": 4.268366090507798}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9067044286329412, "5": 0.0926256849982981, "3": 0.00046379704706105113, "2": 0.00020580858915256905, "1": 1.0364295183904511e-07}, "score": 4.091749976092043}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7057728468019006, "5": 0.2942098766994976, "3": 1.5373935230048413e-05, "2": 1.7796621767768087e-06, "1": 0}, "score": 4.294190979596338}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8984331206277221, "3": 0.06307990644532023, "2": 0.03766673254338541, "5": 0.0008065634421069597, "1": 1.1870217808696131e-05}, "score": 3.8623573325743266}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9833554411929586, "5": 0.010262234247830298, "3": 0.004625551369945294, "2": 0.0017556612717728741, "1": 5.889585672479972e-07}, "score": 4.00212359456919}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9084295405134741, "5": 0.08994670956195909, "3": 0.0014767478613381291, "2": 0.00014621783904507932, "1": 2.268077714561943e-07}, "score": 4.088176894750465}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9201065227903558, "3": 0.05031179179634072, "2": 0.025696748823642993, "5": 0.0038796280241779964, "1": 4.472151255040389e-06}, "score": 3.902160840292721}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6859254367143299, "5": 0.31403953291360726, "3": 2.9714913504088905e-05, "2": 4.850826282500042e-06, "1": 0}, "score": 4.314000262242195}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9923152822937534, "5": 0.005372487264222373, "2": 0.0012368167960202109, "3": 0.0010745650542211289, "1": 0}, "score": 4.001824290166039}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt4", "target_model": "human", "scores": {"5": 0.692536482498503, "4": 0.3073112196803962, "3": 0.00013872472279336594, "2": 1.3313007408879507e-05, "1": 0}, "score": 4.692371311840367}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9808568035000639, "5": 0.01741229696927825, "3": 0.0015454292121451778, "2": 0.00018457512422253187, "1": 0}, "score": 4.015497731382169}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.927616765223569, "5": 0.06719632637406066, "3": 0.0047922190864738735, "2": 0.0003933692971186294, "1": 5.219150509242472e-07}, "score": 4.061615852124038}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6442141030355537, "4": 0.3557687990425166, "3": 1.5654940560988184e-05, "2": 1.0653320748860181e-06, "1": 0}, "score": 4.64419656071122}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7660917334114177, "5": 0.23364476859667793, "3": 0.00020650126906269768, "2": 5.6454305457138524e-05, "1": 0}, "score": 4.2333254852765005}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9161985373148912, "5": 0.04561483438066074, "2": 0.02766679558958467, "3": 0.010501134290358875, "1": 1.7889931310468693e-05}, "score": 3.979726422726152}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8263833739716804, "5": 0.17321936187242107, "3": 0.0002484989345405404, "2": 0.00014838549123037233, "1": 1.0055389344455328e-07}, "score": 4.172673838500172}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9435798934651364, "3": 0.02184683541926427, "5": 0.01755442015672172, "2": 0.017014327427856125, "1": 3.862005306229255e-06}, "score": 3.961667318507772}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9724284378066833, "5": 0.026736946661762788, "3": 0.0005463045247826879, "2": 0.0002878822544905742, "1": 0}, "score": 4.02561488861044}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9556330390368639, "3": 0.027969761466375614, "2": 0.016187660896818154, "5": 0.0001884586384164088, "1": 1.83706366920365e-05}, "score": 3.9397881003347326}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9655279971190657, "5": 0.024938806368496942, "3": 0.006207760972398149, "2": 0.003322775005990269, "1": 1.7812325312412413e-06}, "score": 4.012080162308629}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6925992707021525, "4": 0.3073390633381979, "3": 5.605489945752802e-05, "2": 5.0535024531296565e-06, "1": 0}, "score": 4.692533494925198}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6219397536610102, "5": 0.37722552908952517, "3": 0.0007631644645793163, "2": 6.988482696686938e-05, "1": 0}, "score": 4.376323222662311}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5926539550372673, "4": 0.40732470933018067, "3": 1.7645672302077146e-05, "2": 3.1146461739296215e-06, "1": 0}, "score": 4.59263042102124}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8591130063038374, "5": 0.14024634437239417, "3": 0.0004677951834690765, "2": 0.00017209231672343298, "1": 0}, "score": 4.139434470779946}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9696232383588795, "2": 0.01890464159558724, "3": 0.010118928501771643, "5": 0.0013482167306522917, "1": 4.031093011678749e-06}, "score": 3.953407867788739}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9258135356513504, "2": 0.0446753939430565, "3": 0.023542278244350366, "5": 0.005952418925140522, "1": 1.185562641633735e-05}, "score": 3.893023302636464}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8947658187257196, "5": 0.10357666664066782, "3": 0.0013879284045003385, "2": 0.00026906192510613153, "1": 1.852019473390363e-07}, "score": 4.101650093249869}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7121887958563423, "5": 0.2877502967797898, "3": 5.086741582536247e-05, "2": 9.708216200537407e-06, "1": 0}, "score": 4.287680108364216}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9588115981194729, "3": 0.01574179502887493, "2": 0.014788047882257344, "5": 0.010651431315877228, "1": 5.280783928289081e-06}, "score": 3.965317634116896}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9096176196191198, "2": 0.06589248370818698, "3": 0.02277183303387837, "5": 0.0017019493642635242, "1": 1.2994543751880832e-05}, "score": 3.8471056882936616}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8519043787204674, "4": 0.14803878185256927, "3": 4.382610121148959e-05, "2": 1.2754122567436959e-05, "1": 0}, "score": 4.851835265172535}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8127154505677808, "4": 0.1870977259446814, "3": 0.00015293462736542276, "2": 3.3074432701249806e-05, "1": 0}, "score": 4.812497028794914}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8932947369369755, "4": 0.10668884196942142, "3": 1.316644513574689e-05, "2": 2.324015614949452e-06, "1": 0}, "score": 4.893277753774234}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7057566989038984, "4": 0.29420313937046394, "3": 3.687930516064014e-05, "2": 3.0749097706941317e-06, "1": 0}, "score": 4.705713816222369}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8175024085308187, "5": 0.18240944880949206, "3": 7.73533246475589e-05, "2": 1.0146548089748897e-05, "1": 0}, "score": 4.182311919576388}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5621684167777294, "4": 0.4378172032045076, "3": 1.0806870161626512e-05, "2": 3.194504717973352e-06, "1": 0}, "score": 4.5621514337527715}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7548817987021457, "4": 0.2450742385125607, "3": 3.705641784632114e-05, "2": 6.339605597794093e-06, "1": 0}, "score": 4.754832490883362}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9688550165589558, "4": 0.031143793474667284, "3": 5.041510053301408e-07, "2": 2.3445199081971834e-07, "1": 0}, "score": 4.968854480809403}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9416527301687692, "4": 0.05834575345609561, "3": 9.898187414748822e-07, "2": 2.5820964615362686e-07, "1": 0}, "score": 4.941651476619847}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8585012350772834, "2": 0.07739623832652409, "3": 0.045498901325912944, "5": 0.01838321792222329, "1": 0.0002173901266286656}, "score": 3.817439118736773}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8248485625848164, "5": 0.17289766349582852, "3": 0.0017488350472510317, "2": 0.0005010496299546378, "1": 3.026269152271253e-06}, "score": 4.170137797205537}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8720735432848888, "5": 0.050760763239998896, "2": 0.04768532406603706, "3": 0.029378075914992145, "1": 9.953442437666306e-05}, "score": 3.925713230957428}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9036807713430526, "5": 0.09524726302822355, "3": 0.0009484757837659999, "2": 0.00012248414070417752, "1": 3.9597926031712256e-07}, "score": 4.094052688371543}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.930915308645762, "5": 0.047818771852414, "3": 0.013916055965984553, "2": 0.007333246171992148, "1": 1.5306821182446456e-05}, "score": 4.019190328228641}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9456955740971629, "5": 0.05335249690428254, "3": 0.0007492334056205692, "2": 0.0002016534354687078, "1": 0}, "score": 4.052200011028355}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9441243621007667, "5": 0.054954621386703505, "3": 0.0007479888399156224, "2": 0.0001721968945681467, "1": 0}, "score": 4.0538622835052545}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9606358144786343, "5": 0.014816191143609266, "3": 0.013702736795551474, "2": 0.010839757002125357, "1": 4.386253991704181e-06}, "score": 3.9794207586498462}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5234166752066056, "4": 0.4765763060947025, "3": 5.915100913918977e-06, "2": 9.656136799095811e-07, "1": 0}, "score": 4.523408901100437}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.95600646155962, "5": 0.04333734693096333, "3": 0.000580720781061776, "2": 7.499298366031126e-05, "1": 0}, "score": 4.042606660537686}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9467266877045902, "5": 0.03502757396831143, "3": 0.013716995054828535, "2": 0.0045233848715979675, "1": 3.2629789222402104e-06}, "score": 4.012254045910915}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9751066396160563, "5": 0.023660258378829464, "3": 0.0007487664041949885, "2": 0.0004834399255072057, "1": 3.7122481036506076e-07}, "score": 4.0219435099574765}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9697420962419924, "5": 0.029283671646139528, "3": 0.0008051556058766068, "2": 0.00016876969903540748, "1": 1.2758596043858644e-07}, "score": 4.028140598927697}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6926232142728029, "5": 0.3073496667187903, "3": 2.229786776475419e-05, "2": 4.322638838288489e-06, "1": 0}, "score": 4.307318876772363}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9458573283516686, "5": 0.05336161562517599, "3": 0.0006021291504702928, "2": 0.00017798914369672876, "1": 0}, "score": 4.052403557327648}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6578959637236341, "5": 0.34131195358293637, "3": 0.0006692631010743116, "2": 0.00012188177992984073, "1": 2.245126014856969e-07}, "score": 4.340398496190385}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7718374176773128, "4": 0.22815471627627704, "2": 4.0563297324374615e-06, "3": 3.57969842473786e-06, "1": 0}, "score": 4.771825902853469}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9431904329435866, "5": 0.05664298101879976, "3": 0.0001382271792366285, "2": 2.8082554801105745e-05, "1": 0}, "score": 4.056448604326912}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5774877782578511, "4": 0.4224990840991166, "3": 9.951194139249016e-06, "2": 2.8068631917947746e-06, "1": 0}, "score": 4.577472432537607}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6791428300568144, "5": 0.32080436386880146, "2": 2.9421083934878167e-05, "3": 2.2913163207292643e-05, "1": 0}, "score": 4.32072275986346}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9561839711530741, "5": 0.033757421146929395, "2": 0.005958538774668154, "3": 0.0040952398170897185, "1": 3.5633658367666226e-06}, "score": 4.017734436130222}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9698002834831378, "3": 0.018614951073467854, "2": 0.009215070843905448, "5": 0.0023666259215444556, "1": 2.2972679245133305e-06}, "score": 3.9653146145998375}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9418605739775248, "5": 0.054822855544422316, "3": 0.002262809717604772, "2": 0.0010523042452156468, "1": 6.004881074713003e-07}, "score": 4.050453679061782}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7717732420641711, "5": 0.22813575740710643, "3": 8.537647188394738e-05, "2": 5.457935244915359e-06, "1": 0}, "score": 4.228039502947018}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.730894231391438, "5": 0.268880939889237, "3": 0.00018799202805427906, "2": 3.6443916984768435e-05, "1": 9.467072676597674e-08}, "score": 4.268619856091567}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5898136142751728, "4": 0.2617282309566293, "3": 0.1445400568226314, "5": 0.0031437969180404873, "1": 0.0007704205680134242}, "score": 2.6766601146741773}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.969721023975192, "3": 0.01776105748706752, "2": 0.011114585769074755, "5": 0.0013911535276347592, "1": 1.029480663581908e-05}, "score": 3.961369967286748}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8078363888594892, "5": 0.1918779665333618, "3": 0.00023544787655070613, "2": 4.935255600557395e-05, "1": 0}, "score": 4.191543975241357}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5466863179546935, "5": 0.45321887609526945, "3": 7.887628071188848e-05, "2": 1.5290864490814374e-05, "1": 0}, "score": 4.4531097075342485}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9552852404483284, "5": 0.04068094817242619, "3": 0.0032875245954517643, "2": 0.0007450975563774685, "1": 3.6367871870022037e-07}, "score": 4.035902167067052}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9358756817208798, "5": 0.05982852649978824, "2": 0.0038849401526673856, "3": 0.0004094696795603933, "1": 4.6468875479360327e-07}, "score": 4.0516478298230325}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8303561282791109, "5": 0.16869707973215298, "3": 0.0005453811226979859, "2": 0.0003990093530983126, "1": 9.29121798148741e-07}, "score": 4.167351138944198}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9625976609937388, "5": 0.015080240021257222, "2": 0.014616269812482749, "3": 0.007702232939648159, "1": 1.8903586216266128e-06}, "score": 3.9781397590899563}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6442002461392289, "4": 0.35576115009556364, "2": 2.3135993336553486e-05, "3": 1.4937720005191288e-05, "1": 0}, "score": 4.64413937785983}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5077182201714479, "5": 0.49209737273934495, "2": 0.00010826225362807903, "3": 7.557923362593032e-05, "1": 0}, "score": 4.491805547164641}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9598277055624269, "3": 0.020552933476074144, "2": 0.019307694186560427, "5": 0.0003072416458380229, "1": 2.6581610734957116e-06}, "score": 3.9411308412935018}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9769668596858296, "5": 0.01965246309846391, "3": 0.0023841142673315984, "2": 0.0009938466886241974, "1": 9.350395584967806e-07}, "score": 4.015277877548471}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9582946188083573, "3": 0.029856580833744272, "2": 0.009845655372855193, "5": 0.002000266214560359, "1": 1.824006687365592e-06}, "score": 3.952446852457705}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8898701640391544, "5": 0.1096535202730723, "3": 0.00040170012717785365, "2": 7.430702957618925e-05, "1": 0}, "score": 4.109103239748476}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9959092124607397, "5": 0.002078779367658967, "3": 0.001222051347359155, "2": 0.0007890156516416585, "1": 0}, "score": 3.999278696038145}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9112089269326866, "5": 0.08744607161714468, "3": 0.0010340902751349434, "2": 0.00031049026802394236, "1": 0}, "score": 4.085791036916011}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9681765035007028, "5": 0.028336889706042253, "3": 0.0024376617459036863, "2": 0.0010484252526064726, "1": 2.696634869260226e-07}, "score": 4.023801574417983}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9065706814610632, "5": 0.06990721613144511, "3": 0.02165624529175765, "2": 0.001862964207200522, "1": 1.6988041425412432e-06}, "score": 4.044519999174385}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6513249540148504, "5": 0.34862912531605444, "3": 4.170055999971206e-05, "2": 3.8787562881718425e-06, "1": 0}, "score": 4.3485797862321665}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7115296640866268, "5": 0.2874839633363872, "3": 0.0008595616568464008, "2": 0.00012578166141998957, "1": 0}, "score": 4.286373133108746}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.892325689754646, "5": 0.10657311537962529, "3": 0.0008395252537543196, "2": 0.000260072791194307, "1": 4.0341541478387757e-07}, "score": 4.105212359858233}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7247754327792053, "5": 0.27509370332235983, "3": 0.00011665741445093267, "2": 1.3716734146101945e-05, "1": 0}, "score": 4.274949747096211}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9502872629910123, "5": 0.030073346435385232, "3": 0.016097102373350783, "2": 0.003536064123136443, "1": 4.339002825332355e-06}, "score": 4.006891111797543}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.787908115987357, "5": 0.21206259255208745, "3": 2.5764860255761956e-05, "2": 3.029466580440995e-06, "1": 0}, "score": 4.212030874166368}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9427622999921083, "5": 0.05661727660377362, "3": 0.0004975492556175458, "2": 0.00012192968888284567, "1": 0}, "score": 4.055875920742941}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.49955706658592447, "5": 0.49955706658592447, "3": 0.000799492345376011, "2": 8.42658395394352e-05, "1": 0}, "score": 4.498590093910098}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8077817648097344, "5": 0.19186499602123241, "3": 0.00033724081440516406, "2": 1.552841479099093e-05, "1": 0}, "score": 4.191496788369215}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8207501744918255, "5": 0.1774996751871305, "3": 0.0015598564206520651, "2": 0.00018923214806567968, "1": 0}, "score": 4.175561540873222}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8080133244023842, "5": 0.1919199924096981, "3": 5.9543584557403726e-05, "2": 7.001213967616084e-06, "1": 0}, "score": 4.1918464729467235}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7121602447798265, "4": 0.2877387582242385, "3": 9.35557539925411e-05, "2": 6.7771560883758785e-06, "1": 0}, "score": 4.712053607578386}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9791563876226647, "5": 0.015339654593768797, "2": 0.002837550780849863, "3": 0.0026656322699269396, "1": 2.8580988069138776e-07}, "score": 4.006998066754015}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9785470103690974, "3": 0.00782985255449718, "5": 0.007129161878947612, "2": 0.006491175758737353, "1": 1.9216776065758063e-06}, "score": 3.986311180758643}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9663727786364434, "5": 0.016369582367324585, "2": 0.008762006042193432, "3": 0.00849242745677641, "1": 1.958013733178122e-06}, "score": 3.9903472567433234}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.776930328457277, "5": 0.22259426592917292, "3": 0.00031438129294202423, "2": 0.00016057025264146717, "1": 0}, "score": 4.22195884491535}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9607293292414706, "2": 0.02901150800361771, "3": 0.01002611189219628, "5": 0.00021807140564005344, "1": 1.0857135981677532e-05}, "score": 3.932136092341445}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9887165421562402, "5": 0.00969303202060375, "3": 0.001122049898560725, "2": 0.0004677399868940893, "1": 2.931451377184574e-07}, "score": 4.007634625329934}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7772722763378535, "4": 0.2226922289564673, "3": 2.5417058877958052e-05, "2": 9.95346327018386e-06, "1": 5.473759879136347e-08}, "score": 4.7772268421148825}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8174395531871314, "5": 0.18239540382267264, "3": 0.000144504053341352, "2": 2.0177286840928868e-05, "1": 0}, "score": 4.1822106110921204}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5621276835300331, "5": 0.4377854801193046, "3": 7.50091088851977e-05, "2": 1.1149108705273825e-05, "1": 0}, "score": 4.437688469604034}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5312000429315396, "4": 0.46878239253988774, "3": 1.395752177039364e-05, "2": 3.1633878507231407e-06, "1": 0}, "score": 4.531179994275581}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9689850650066345, "5": 0.029260815879370742, "3": 0.0012656986712256406, "2": 0.0004879703071336131, "1": 0}, "score": 4.027019188756178}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8998868912001952, "5": 0.08112726374016675, "3": 0.014545313986812676, "2": 0.004436070131469826, "1": 3.569853497962713e-06}, "score": 4.0576991513449325}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9782820185404514, "5": 0.011935866741519342, "3": 0.007951001368071368, "2": 0.001830424448411183, "1": 2.1554804621047154e-07}, "score": 4.000323369985555}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6512185622606776, "5": 0.3485721639708465, "3": 0.00015250929697569103, "2": 5.610503494486675e-05, "1": 0}, "score": 4.348307674290793}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9661561807915777, "5": 0.029175388053698383, "3": 0.0038269788464635767, "2": 0.0008406756871587828, "1": 2.1963362933222223e-07}, "score": 4.023666412113926}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8667874222337741, "5": 0.13292615905678457, "3": 0.0002448569244108448, "2": 4.060125826857506e-05, "1": 0}, "score": 4.1326002269819035}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9835878837358283, "3": 0.008120017253463759, "2": 0.006034284438875866, "5": 0.0022548473552586245, "1": 2.1214239929045905e-06}, "score": 3.982059881778446}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9853575024593654, "5": 0.010946330423793555, "3": 0.002367309975276784, "2": 0.0013279405440192375, "1": 5.720007696646206e-07}, "score": 4.0059214253986735}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7605050172501115, "5": 0.23930351392322607, "3": 0.00016731253960014685, "2": 2.3729964108796123e-05, "1": 0}, "score": 4.239088843384471}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6653318967330708, "5": 0.33454987747219267, "3": 0.00010379487108145003, "2": 1.4047108276315739e-05, "1": 0}, "score": 4.334418116739374}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7560762107598332, "2": 0.16870340599125958, "3": 0.07486169009630642, "5": 0.00029193233850361577, "1": 6.313479588952359e-05}, "score": 3.587832531345264}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9172158291727107, "5": 0.08268952066797151, "3": 8.95434120002683e-05, "2": 4.8962693498535785e-06, "1": 0}, "score": 4.082590202100689}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9791252969635019, "3": 0.011048387381435924, "5": 0.007713017447059241, "2": 0.0021086216318618144, "1": 3.2708194765552983e-06}, "score": 3.992437563712525}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9625669517304216, "5": 0.03732276935881784, "3": 0.0001064828093923286, "2": 3.3175732204881227e-06, "1": 0}, "score": 4.037209669208859}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9893032979883707, "5": 0.010324309694971398, "3": 0.0003318740594569864, "2": 4.026089127578623e-05, "1": 0}, "score": 4.009911916403952}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8639810269221858, "2": 0.05879464497962069, "3": 0.04040892914481476, "5": 0.03679274867862548, "1": 2.1326097510549018e-05}, "score": 3.8787303906995807}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5076268238875536, "4": 0.49200878842348716, "3": 0.0003334111983097649, "2": 3.053127469127969e-05, "1": 0}, "score": 4.507232575967898}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8974182348509444, "5": 0.040681444483021384, "3": 0.03942980801944864, "2": 0.022466427391919445, "1": 3.3970335244308767e-06}, "score": 3.9563085605097883}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.77727012329663, "4": 0.2226916276882608, "3": 3.213010875498101e-05, "2": 5.583375701844723e-06, "1": 0}, "score": 4.777227242665483}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5926440577988602, "4": 0.4073179070643339, "3": 3.195167349347235e-05, "2": 5.910465292203624e-06, "1": 0}, "score": 4.5926003877134765}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9284563505598638, "2": 0.05237992352015251, "3": 0.01810201537905224, "5": 0.0010536636473014583, "1": 6.265313067467622e-06}, "score": 3.8781727882437496}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9764370262424191, "5": 0.009876520552980545, "3": 0.007691841940682073, "2": 0.0059904125266646725, "1": 2.4239914911864025e-06}, "score": 3.9901965641858896}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9804259949919656, "5": 0.01795713051055638, "3": 0.0009516930515551495, "2": 0.0006643888250355596, "1": 0}, "score": 4.015676672234587}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9576849158214278, "5": 0.04207773660093093, "3": 0.00018021463513903687, "2": 5.670705092634571e-05, "1": 0}, "score": 4.041784125659446}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9703308783005588, "5": 0.029301452230690212, "3": 0.00024189834065594325, "2": 0.00012549520591531972, "1": 0}, "score": 4.028808571427128}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt4", "target_model": "human", "scores": {"4": 0.880753797591503, "5": 0.11919705869891524, "3": 4.460779225327557e-05, "2": 4.1491710112538185e-06, "1": 0}, "score": 4.11914419864322}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6990451266236788, "5": 0.3006555565132868, "3": 0.0002496276875342052, "2": 4.915460612970945e-05, "1": 0}, "score": 4.300307780148834}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7547817080117972, "5": 0.24504171931880628, "3": 0.0001609444956394461, "2": 1.5445374261499605e-05, "1": 0}, "score": 4.244849928833088}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8438196264187516, "5": 0.15609093888601794, "3": 8.237801210860828e-05, "2": 6.352310201265605e-06, "1": 0}, "score": 4.155995966132841}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6150824223956435, "4": 0.38490874452405055, "3": 7.399308559686084e-06, "2": 1.2462469039080363e-06, "1": 0}, "score": 4.615072645934677}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9806782704627299, "5": 0.009919421261121377, "2": 0.005066344638544144, "3": 0.004333474213107746, "1": 1.699568776435111e-06}, "score": 3.995448155469296}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9563276447629262, "5": 0.04335190639092185, "3": 0.00026183919556888556, "2": 5.842422164042148e-05, "1": 0}, "score": 4.0429732267205525}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9804222105549288, "5": 0.010891506648999894, "2": 0.006402786453557432, "3": 0.002282983816862273, "1": 1.847712986751704e-07}, "score": 3.995802394235343}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9621988489369778, "5": 0.037308496129467225, "3": 0.00042761641109552, "2": 6.456042183658474e-05, "1": 0}, "score": 4.036751776445746}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9045998081690918, "5": 0.09534412156153356, "3": 5.031848768391353e-05, "2": 5.645577853821311e-06, "1": 0}, "score": 4.095282522037512}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8927470383135541, "5": 0.1066234297633449, "3": 0.0004495776371755779, "2": 0.00017882962876080924, "1": 4.945082512383012e-07}, "score": 4.10581477602296}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6924612355725542, "5": 0.30727781676629823, "3": 0.00022869347229431867, "2": 3.095029584731605e-05, "1": 0}, "score": 4.306987622981324}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9868079144903582, "2": 0.007653019524009168, "3": 0.005426803458789017, "5": 0.00010916446060060493, "1": 1.46280460880907e-06}, "score": 3.9793718998076257}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6150779753658057, "5": 0.3849059500967091, "3": 1.1823978643018945e-05, "2": 3.838683840448533e-06, "1": 0}, "score": 4.384886607275558}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9045914171401889, "5": 0.0953432253310032, "3": 5.1110428568555424e-05, "2": 1.375618523121046e-05, "1": 0}, "score": 4.095264649298818}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9754645011463811, "2": 0.012279288471525871, "3": 0.007805190639568234, "5": 0.004447263570176548, "1": 2.3840353043480366e-06}, "score": 3.972076305566508}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9699514376658266, "3": 0.01668893256357337, "2": 0.011650752602313887, "5": 0.0017048817934583308, "1": 2.445810492972002e-06}, "score": 3.9617070472563847}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9291101582169594, "3": 0.05001646638852391, "2": 0.016753417695538772, "5": 0.004105601574674267, "1": 1.2665193453154652e-05}, "score": 3.9205441698604}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9782748281940397, "5": 0.021612906923391347, "3": 9.402357587126561e-05, "2": 1.8227301599587613e-05, "1": 0}, "score": 4.021482429045184}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9336746424456585, "2": 0.03735167957027633, "3": 0.02819452694044832, "5": 0.0007752093779516833, "1": 2.97615904464616e-06}, "score": 3.89786829621098}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9728181737958429, "3": 0.010312144506628734, "5": 0.009994873174547232, "2": 0.0068693691757418015, "1": 3.981674892219602e-06}, "score": 3.9859320247852597}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9961187595596234, "5": 0.002393164811719002, "3": 0.0012033588386211956, "2": 0.00028139139302974387, "1": 1.0470708068956106e-06}, "score": 4.0006238833960275}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9460653518712502, "5": 0.044248071075166394, "2": 0.005367897361132144, "3": 0.004313226702915618, "1": 4.387749959363345e-06}, "score": 4.0291859174901035}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8221569708929791, "5": 0.17780392158268166, "3": 2.906941405335411e-05, "2": 9.437456997082898e-06, "1": 0}, "score": 4.17775608402441}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9625666215700137, "3": 0.019977432850054874, "2": 0.016561873539189153, "5": 0.0008915696472897625, "1": 1.259208763159989e-06}, "score": 3.9477865471816016}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6278321972813403, "2": 0.3360543419843092, "3": 0.030296223839267472, "5": 0.005347602229175904, "1": 0.00046002395212489146}, "score": 3.3015559100186747}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8009407938011674, "2": 0.15771458556103538, "5": 0.023442182700185436, "3": 0.017695091398179486, "1": 0.0002060083203380115}, "score": 3.6896994799688407}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8271875219706931, "3": 0.07938276498272269, "5": 0.06279693578066052, "2": 0.030604782236378705, "1": 2.5410476712135935e-05}, "score": 3.922128173631194}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8215195285233152, "5": 0.17766605256012344, "3": 0.0006928309693482496, "2": 0.00012039590949026996, "1": 4.6221993932493286e-07}, "score": 4.176731172093528}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9262798927667698, "2": 0.02797122712027625, "5": 0.027110642934057783, "3": 0.018632854229708142, "1": 4.295987974471953e-06}, "score": 3.952522394893559}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt4", "target_model": "human", "scores": {"2": 0.6700187579826526, "4": 0.2793053922265111, "3": 0.04930033020922704, "5": 0.0009612031278478937, "1": 0.0004069990120175227}, "score": 2.6103921915430774}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9490440947646143, "5": 0.039171728661337, "3": 0.010542927742609176, "2": 0.0012396514841991392, "1": 0}, "score": 4.026149539720224}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5846632725217119, "5": 0.41458834118922744, "3": 0.0006953506550475823, "2": 5.1969996307215856e-05, "1": 0}, "score": 4.41378949149125}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6075502263898898, "5": 0.3922638966316474, "3": 0.00016122720123088802, "2": 2.3964284064771156e-05, "1": 0}, "score": 4.392055009613316}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9211660093011157, "5": 0.07801415456296866, "3": 0.0007073464385436835, "2": 0.00011191845860439524, "1": 0}, "score": 4.0770830152400235}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9093203378588104, "5": 0.07945553674556788, "3": 0.009197643215252708, "2": 0.002020454081518916, "1": 3.4962922784148586e-06}, "score": 4.066206664112909}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5543433604588612, "5": 0.4454274037033469, "3": 0.00014710763915384763, "2": 8.124055416040982e-05, "1": 0}, "score": 4.445118210062593}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8735929360915308, "5": 0.10433580367439825, "3": 0.012657365250493822, "2": 0.00940615515756969, "1": 6.275295389691204e-06}, "score": 4.072847408909857}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7662737477824179, "4": 0.23370028918928176, "3": 2.177025433425255e-05, "2": 3.6098620487222175e-06, "1": 0}, "score": 4.766245204457447}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9700849121664844, "5": 0.02667251352025788, "3": 0.002767677660885518, "2": 0.00047349381865795763, "1": 4.892598979555287e-07}, "score": 4.0229564014147305}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9642800251815545, "5": 0.0329958461394713, "3": 0.001694913452373441, "2": 0.0010280169744238802, "1": 5.597654389393731e-07}, "score": 4.029243238113352}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9590161402004724, "5": 0.04083982788776553, "3": 9.50985343693634e-05, "2": 4.857157862868738e-05, "1": 0}, "score": 4.040647600902391}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9586565631490995, "5": 0.04082451582349911, "3": 0.0003587633783563903, "2": 0.00015920036370141078, "1": 0}, "score": 4.040147390150247}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7310565956496217, "4": 0.2689406918722799, "3": 1.704881416649043e-06, "2": 8.05328957614726e-07, "1": 0}, "score": 4.731053427978803}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5234113520860869, "4": 0.4765714593383153, "3": 1.4189440453815473e-05, "2": 2.750748504132622e-06, "1": 0}, "score": 4.523391791152153}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9715747230414685, "5": 0.021464879309204293, "3": 0.004864885982005485, "2": 0.0020923613881855254, "1": 2.1620320816095974e-06}, "score": 4.012408796717541}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9593312421836268, "5": 0.024016384357325834, "2": 0.011523190602946213, "3": 0.005113384833608959, "1": 1.4362441326282618e-05}, "score": 3.995813524983821}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7477489766839478, "5": 0.2504645463526742, "3": 0.0013773925825194253, "2": 0.0004071564696857207, "1": 1.2365466787374346e-06}, "score": 4.248269302835328}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.90874121255213, "5": 0.08997755757725782, "3": 0.001097802307411692, "2": 0.00018203346757828364, "1": 5.44270212095987e-07}, "score": 4.08851413074561}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9920196737347722, "5": 0.00668417624769991, "3": 0.000682831591868461, "2": 0.0006120862830583459, "1": 7.629006681864311e-07}, "score": 4.004774885628287}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9857413365025236, "5": 0.007526227189367811, "3": 0.0037844246937976164, "2": 0.0029473129150043454, "1": 3.111125789739229e-07}, "score": 3.997846242493057}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9740116640506127, "5": 0.025157933119192653, "3": 0.0004982258847212682, "2": 0.00033188998979416523, "1": 0}, "score": 4.023995934140652}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9861405400392119, "5": 0.011302780743972953, "3": 0.0022256494907614208, "2": 0.00033081342903728796, "1": 1.0589360217477177e-07}, "score": 4.008415187643395}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8030934545911916, "5": 0.19680651307860456, "3": 7.840216626958783e-05, "2": 2.1433959525647342e-05, "1": 0}, "score": 4.196685281583802}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8961157671006197, "5": 0.10054139959870004, "2": 0.0019298538583393924, "3": 0.001411911244344078, "1": 4.886785136383291e-07}, "score": 4.095268369812013}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9370001749788772, "5": 0.0618018611052658, "3": 0.0008678891142711543, "2": 0.0003294134201020767, "1": 2.7350470836610377e-07}, "score": 4.060274348015685}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7632465404758175, "2": 0.18128695796854696, "3": 0.05528938731457433, "5": 0.0001267493555403737, "1": 4.590557447568563e-05}, "score": 3.5821238659407846}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9866574880770715, "5": 0.006648044684210094, "3": 0.0035032733664539595, "2": 0.003189766698903043, "1": 7.354321877498653e-07}, "score": 3.9967630293842413}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9955581742179381, "5": 0.002144011225527946, "3": 0.0019218792415239797, "2": 0.0003725732854620128, "1": 2.433142320460724e-06}, "score": 3.9994696854935157}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9986309382213141, "3": 0.0007549417228292874, "2": 0.0003510805056399489, "5": 0.0002609008781443311, "1": 1.2272373152196793e-06}, "score": 3.998800115338473}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9871861435912224, "5": 0.009380272173691025, "3": 0.0028608213787955955, "2": 0.0005722002731387419, "1": 0}, "score": 4.005375053272532}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9638008546749959, "5": 0.03510644665465327, "2": 0.0005586454743784396, "3": 0.0005330632355654264, "1": 2.813276029182509e-07}, "score": 4.033455272195026}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7247057997008505, "5": 0.27506729559443216, "3": 0.0001644976950024795, "2": 6.146829773764846e-05, "1": 0}, "score": 4.274780119243343}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7370021128293225, "5": 0.2627861750789293, "3": 0.00018662412325739014, "2": 2.4100234192108607e-05, "1": 0}, "score": 4.262551609818518}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7825014371156457, "5": 0.21729280568979864, "3": 0.0001776164691509008, "2": 2.7667309615260714e-05, "1": 0}, "score": 4.217059957361029}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9558791213764997, "3": 0.027976964607317804, "4": 0.01474282139132431, "1": 0.0013928907710516584, "5": 6.350360341352631e-06}, "score": 2.056088871548118}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9392442654529852, "5": 0.060043871036687034, "3": 0.000646504758097411, "2": 6.502075703802241e-05, "1": 0}, "score": 4.059267344796591}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5077260238604631, "5": 0.4921049363340901, "3": 0.00016252332955611444, "2": 6.107830020438208e-06, "1": 0}, "score": 4.491930398369818}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7825071259217723, "5": 0.21729437020363185, "3": 0.00018325572064073503, "2": 1.4579735103981656e-05, "1": 0}, "score": 4.217082100114551}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9742392665162898, "5": 0.025163813215225064, "3": 0.0005388365391139487, "2": 5.768732957413994e-05, "1": 0}, "score": 4.024509611732569}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9845202424170615, "2": 0.011284211981436613, "3": 0.0022925267165693265, "5": 0.0019005714022424774, "1": 1.994781574664955e-06}, "score": 3.9770336259811727}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8395265138976675, "5": 0.160226442286545, "3": 0.0001905602767614049, "2": 5.63295102160268e-05, "1": 0}, "score": 4.159923247622139}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9478643790831974, "5": 0.05182960333515234, "3": 0.0002118157002138781, "2": 9.399264720284883e-05, "1": 0}, "score": 4.05142981310141}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8774489780543415, "5": 0.12251933802838008, "3": 2.2697948772608543e-05, "2": 8.75083879415582e-06, "1": 0}, "score": 4.1224791672005106}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9457988875245539, "5": 0.05335832331506071, "3": 0.0005149967335201363, "2": 0.0003273518407194878, "1": 1.4777130422833692e-07}, "score": 4.052188194867667}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt4", "target_model": "human", "scores": {"4": 0.869503734673812, "5": 0.12924018585059313, "3": 0.001066943244218438, "2": 0.00018832666936775372, "1": 2.9672575754103186e-07}, "score": 4.127795764628667}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7771306469158932, "5": 0.22265165812846607, "3": 0.00017639725072009978, "2": 4.0608952936063644e-05, "1": 1.464587526514049e-07}, "score": 4.222393724198227}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8433729674978357, "5": 0.15600831061164397, "3": 0.0005123021347683415, "2": 0.00010571952090216933, "1": 2.2414537501393865e-07}, "score": 4.15528397092801}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6790401785852167, "5": 0.3207558619158245, "3": 0.00017194687416414986, "2": 3.1313852075360176e-05, "1": 0}, "score": 4.320521511309198}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.615060341333037, "5": 0.38489493809500425, "3": 3.876820911089554e-05, "2": 5.762379851061767e-06, "1": 6.204474615704094e-08}, "score": 4.384844508228285}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9826324118388344, "5": 0.01539411477609083, "3": 0.0015005928734464025, "2": 0.00047218249743471617, "1": 0}, "score": 4.012949165946476}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9921705709065387, "5": 0.006479512518981506, "3": 0.0007738674130633306, "2": 0.0005750894293246985, "1": 0}, "score": 4.004555470619301}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.925220871475129, "3": 0.04327315556878914, "2": 0.026246495594985094, "5": 0.005249630950459478, "1": 8.143031720949555e-06}, "score": 3.909458900870738}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9796173193871823, "5": 0.020331310338006524, "3": 4.588629818271081e-05, "2": 5.229373901290381e-06, "1": 0}, "score": 4.020274970454085}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.4605745256533906, "4": 0.3586958012416014, "3": 0.18036357574986545, "1": 0.0002931998791874862, "5": 4.9382917162616215e-05}, "score": 2.897631234507806}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt4", "target_model": "human", "scores": {"4": 0.961113496007907, "5": 0.03726641351242316, "3": 0.0012751862915822815, "2": 0.0003432117343288795, "1": 4.923691977174868e-07}, "score": 4.0353033690116185}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5621634359876218, "4": 0.4378133241612714, "3": 1.673784892941218e-05, "2": 5.875537574955678e-06, "1": 0}, "score": 4.56213529922141}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.933255087334548, "2": 0.04503448271954133, "3": 0.021607780949833618, "5": 9.110917912432832e-05, "1": 0}, "score": 3.88841307509752}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7606342456358791, "4": 0.23934417504430602, "3": 1.3736177667642949e-05, "2": 7.015753061452836e-06, "1": 0}, "score": 4.760607107270107}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.8175654976259464, "4": 0.1824235313625197, "3": 8.153608238798486e-06, "2": 2.194513886440804e-06, "1": 0}, "score": 4.817553464235329}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8654352408365161, "2": 0.09121620602916525, "3": 0.03923160135266371, "5": 0.004070873432384473, "1": 4.3831930470587855e-05}, "score": 3.7822748751281647}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7540573747773561, "2": 0.20295177291749675, "3": 0.042540998391911035, "5": 0.00038571507836843605, "1": 5.823424349788519e-05}, "score": 3.551763821469499}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9747030543626923, "5": 0.014800084333778883, "3": 0.008700520739481753, "2": 0.0017954539357782125, "1": 4.012235835736071e-07}, "score": 4.00250745326912}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9633677447384241, "2": 0.018782680194928267, "5": 0.012708998412419823, "3": 0.005134899537797039, "1": 4.682422283451345e-06}, "score": 3.9699946613717816}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9652221431304069, "3": 0.013984971363339397, "2": 0.010556410217730775, "5": 0.010231623619790327, "1": 3.029018252564173e-06}, "score": 3.975124699427253}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt4", "target_model": "human", "scores": {"4": 0.850118837879653, "5": 0.1477285072917121, "3": 0.001258286631094501, "2": 0.0008922588293874367, "1": 1.0125850920157186e-06}, "score": 4.144682823932237}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7490769378345083, "4": 0.25090934007933285, "3": 1.104078957718699e-05, "2": 2.314275218517548e-06, "1": 0}, "score": 4.749061543416083}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8175253316197341, "4": 0.1824145563455639, "3": 4.91701906098622e-05, "2": 1.0468937695262052e-05, "1": 0}, "score": 4.817455610133721}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7185796885569936, "4": 0.2813998408125852, "3": 1.5652905550993764e-05, "2": 4.212922376052746e-06, "1": 0}, "score": 4.718556044391178}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.665401454165259, "4": 0.33458487321962194, "3": 1.0278152828770188e-05, "2": 3.1840232113877297e-06, "1": 0}, "score": 4.665384947989003}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.41159817868318466, "2": 0.33072842786124246, "3": 0.25757155860231024, "5": 8.374718498026001e-05, "1": 1.304529533399755e-05}, "score": 3.081011563091749}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8077509000581758, "5": 0.19185764773260539, "3": 0.00031679616611720305, "2": 7.407910864712257e-05, "1": 1.7521500800218172e-07}, "score": 4.191392244590156}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.873047600001072, "5": 0.12577445698078524, "3": 0.0009454117604758451, "2": 0.0002316831158312728, "1": 2.3939761650298115e-07}, "score": 4.124365036502294}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6297232133659012, "5": 0.3701951647911591, "3": 6.966238889318133e-05, "2": 1.1372072373634326e-05, "1": 0}, "score": 4.370102975649224}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8437735382494359, "5": 0.15608241655341656, "3": 0.00012758267144478503, "2": 1.622031644355983e-05, "1": 0}, "score": 4.155922431014941}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8926206030408238, "5": 0.10014926058229112, "2": 0.0047578061968154345, "3": 0.002468317338413571, "1": 1.7529350561031604e-06}, "score": 4.088160271279057}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9196387675603632, "4": 0.08035714237169533, "3": 2.4302291612915723e-06, "2": 1.3632350086133627e-06, "1": 0}, "score": 4.919633883628064}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8383204693046201, "5": 0.15999625024366992, "3": 0.0011475741492895264, "2": 0.0005336715410058289, "1": 0}, "score": 4.157781654060391}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6653769678422967, "4": 0.3345725272655844, "3": 3.9398768440667555e-05, "2": 1.027778282192852e-05, "1": 0}, "score": 4.665317564617934}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7772633377580725, "4": 0.22268969027952767, "3": 3.5843403881324864e-05, "2": 1.026930714779673e-05, "1": 0}, "score": 4.777207623556612}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9831423485435501, "5": 0.012570832870287547, "3": 0.003330939109112403, "2": 0.0009543300328099116, "1": 8.303853224234035e-07}, "score": 4.007328747809389}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9913633737958353, "5": 0.003865945482810124, "3": 0.0034116849141408423, "2": 0.0013570744988065063, "1": 1.0100113394458724e-06}, "score": 3.9977370794748452}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9502912456532772, "2": 0.025324403067595373, "3": 0.023058131388809907, "5": 0.001321335911498332, "1": 3.486500663429924e-06}, "score": 3.9276038377134523}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9851654153933108, "5": 0.014052632980673947, "3": 0.0006370289219803334, "2": 0.0001443786782437157, "1": 0}, "score": 4.013126853843554}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9895511801827095, "5": 0.006879192521402772, "3": 0.002652164977189684, "2": 0.0009165636904252774, "1": 0}, "score": 4.002393902314591}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5954153200775295, "5": 0.3966321111846184, "3": 0.006022541094519883, "2": 0.0019249197508143562, "1": 4.0179188033548465e-06}, "score": 4.38674809837732}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.850013395678663, "5": 0.14771019009249778, "2": 0.0011819044509800525, "3": 0.0010930829288238516, "1": 9.967628090025235e-07}, "score": 4.144250370013385}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6149375752413914, "5": 0.38481808994653993, "3": 0.0002265635677723842, "2": 1.71998481959616e-05, "1": 0}, "score": 4.384557346416945}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9098199683696336, "5": 0.09008437030034616, "3": 8.882139520442827e-05, "2": 6.63844372972649e-06, "1": 0}, "score": 4.0899822901483125}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7545577824066416, "5": 0.24496905072214195, "3": 0.0003514305668784109, "2": 0.00012145108121539212, "1": 0}, "score": 4.2443747876941735}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6432111667676326, "5": 0.35521490729814775, "3": 0.0012224389212880016, "2": 0.0003502346148176088, "1": 3.9746577785691566e-07}, "score": 4.353291108789884}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6718910362795408, "4": 0.32745353887542633, "3": 0.0005240574197348409, "2": 0.00013044824498727702, "1": 0}, "score": 4.671106699237895}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8214625088317317, "4": 0.17765372296391774, "3": 0.0007850257799660716, "2": 9.673415616820039e-05, "1": 6.517896172625907e-07}, "score": 4.820483172338442}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9124268200015846, "4": 0.08756294261947875, "3": 8.156894805117358e-06, "2": 1.7367031211884826e-06, "1": 0}, "score": 4.91241550337166}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6925263715396687, "4": 0.3073067022386701, "3": 0.0001224223018287521, "2": 4.3651015995197564e-05, "1": 0}, "score": 4.692317237685878}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5432236855234649, "2": 0.3193447623754703, "3": 0.137348470814164, "1": 4.261266706264449e-05, "5": 3.879927488657552e-05}, "score": 3.223871670082685}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6943044402174641, "2": 0.18112012388020318, "3": 0.12448191931615636, "1": 5.116427619563824e-05, "5": 3.408275568399297e-05}, "score": 3.5131543968543855}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.866154586499156, "2": 0.08056493288588681, "3": 0.051210187096469975, "5": 0.002048664830943239, "1": 1.946647115998677e-05}, "score": 3.789649757726479}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9598062987638286, "5": 0.03839708629506495, "3": 0.0014888166041374133, "2": 0.0003072345793614332, "1": 3.2246410797657866e-07}, "score": 4.036292841897107}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9856626962099984, "3": 0.00966309778971628, "2": 0.00390424443877589, "5": 0.000768791312846019, "1": 4.818218003848801e-07}, "score": 3.9832957476805206}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.801499284206742, "5": 0.19641584679260723, "3": 0.0018957400291077287, "2": 0.00018770358780187806, "1": 0}, "score": 4.194144976318988}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9415660682061667, "5": 0.05654544092033857, "3": 0.001629331126860593, "2": 0.00025779754252269125, "1": 6.390162196673591e-07}, "score": 4.05439863700021}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9490826457187083, "5": 0.0457982499175169, "3": 0.004464337731798765, "2": 0.0006532769494462673, "1": 5.957117069971557e-07}, "score": 4.04002560693343}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8079625908385418, "5": 0.19190792102182463, "3": 0.00012027376963859795, "2": 8.712602650213565e-06, "1": 0}, "score": 4.19177031827097}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7538710852963464, "5": 0.24474610791157578, "3": 0.0013045345089004185, "2": 7.712878505922547e-05, "1": 3.30334849991139e-07}, "score": 4.24328652265967}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8989592802771714, "5": 0.07733237409537365, "2": 0.01430505510983346, "3": 0.009381484183149992, "1": 1.9582132786626573e-05}, "score": 4.039282120665555}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.724755711907983, "5": 0.27508624838401474, "3": 0.00012035738896284614, "2": 3.72849797530766e-05, "1": 1.4314324425275597e-07}, "score": 4.274890961482007}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9056772387781498, "5": 0.06560704470513946, "2": 0.015583034321886069, "3": 0.013122230530101095, "1": 8.485115899766102e-06}, "score": 4.021293332057944}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6001484726266652, "5": 0.39978507051371004, "3": 5.6787007477262973e-05, "2": 9.270224136352562e-06, "1": 0}, "score": 4.399709902793234}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8306202899664413, "5": 0.16875075080914803, "3": 0.0003361064609907836, "2": 0.0002920145290246776, "1": 0}, "score": 4.167830755971621}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9204775477222643, "5": 0.07795585297686569, "3": 0.0011294912148466618, "2": 0.00043545765476685596, "1": 4.865199154409708e-07}, "score": 4.075954075296549}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9893140349553278, "5": 0.008694030832591352, "3": 0.0012139587081248725, "2": 0.0007716391033120813, "1": 0}, "score": 4.005936831535985}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7874222053651458, "5": 0.2119318114823106, "3": 0.0005012698395385421, "2": 0.0001436162135491301, "1": 0}, "score": 4.211143540861138}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7548606774049064, "5": 0.24506737652995056, "3": 6.109399366340983e-05, "2": 1.0289907473953466e-05, "1": 0}, "score": 4.24498584044356}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9040803724179697, "5": 0.0952893716237961, "3": 0.0004277006598267334, "2": 0.00020203148628741144, "1": 1.5513626146328098e-07}, "score": 4.0944571774066905}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8791930419444176, "3": 0.06172903964770732, "4": 0.056204930197276445, "1": 0.0027548948612255994, "5": 0.00011194521031270356}, "score": 2.1717208965759247}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.6502049422620216, "4": 0.25462393170654546, "3": 0.09367090970507944, "5": 0.001235730976735606, "1": 0.0002631022021346489}, "score": 2.606363702536672}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7527933834522935, "5": 0.24439622446090284, "3": 0.0024337071694868853, "2": 0.000373221082286926, "1": 2.5147453802374006e-06}, "score": 4.24120875981944}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.546623725954748, "5": 0.45316698550474954, "3": 0.00018919279187206792, "2": 1.9631620517023658e-05, "1": 0}, "score": 4.452938739693447}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9624294540498816, "5": 0.019059881461579515, "3": 0.01630278543803031, "2": 0.002206342084801557, "1": 9.959736853919918e-07}, "score": 3.998341423035613}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.874873477694707, "2": 0.11475842640663204, "3": 0.009273902558713243, "5": 0.0010405030300762853, "1": 5.180359549537766e-05}, "score": 3.7620938880107313}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9365749202789337, "2": 0.04519468443748869, "3": 0.017698498031151554, "5": 0.0004790763876953093, "1": 4.597554193230605e-05}, "score": 3.8922525452896615}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9687888876789957, "5": 0.024635088267023427, "3": 0.0034398283744145365, "2": 0.003131999376273475, "1": 3.339017352837298e-06}, "score": 4.014921256879786}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6584076043132453, "4": 0.34157735850071463, "3": 1.3058699734286953e-05, "2": 1.465145504425835e-06, "1": 0}, "score": 4.6583919533019555}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.8269182666328024, "4": 0.14825827867485583, "3": 0.02458363257406655, "1": 0.00019365661364841429, "5": 4.2540712474061766e-05}, "score": 2.3210353191338577}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9768096363608674, "5": 0.019044755826602415, "2": 0.002136761957111556, "3": 0.0020073020946334836, "1": 9.797552905336548e-07}, "score": 4.0127609977491465}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6583136233357815, "5": 0.3415285847364504, "3": 0.00014483013283111387, "2": 1.1343972640284541e-05, "1": 0}, "score": 4.341361618920777}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6915948650087111, "5": 0.30689334566883547, "3": 0.0009175944872125861, "2": 0.0005924435285271634, "1": 8.499145686362751e-07}, "score": 4.304788589114903}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5850684675802763, "5": 0.41487566751034854, "3": 4.17880142492513e-05, "2": 1.3566581932025312e-05, "1": 0}, "score": 4.414806958013699}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6856303122106098, "5": 0.31390443077190494, "3": 0.00039741018463672654, "2": 6.693476965874884e-05, "1": 0}, "score": 4.313373436864326}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7719580266961591, "2": 0.1427978764479357, "3": 0.07886048503249686, "5": 0.0063729022558178935, "1": 8.068241542369403e-06}, "score": 3.6418915137215495}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7549103337734461, "4": 0.24508350249386462, "3": 5.015226364908757e-06, "2": 1.003108378986443e-06, "1": 0}, "score": 4.754903422091729}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9622488470503321, "5": 0.025643062802194205, "3": 0.007580076401690191, "2": 0.004526270354068884, "1": 9.209528466436269e-07}, "score": 4.0090076902421}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6370065378257034, "4": 0.3629553699761798, "3": 2.183000845699651e-05, "2": 1.5971175367176008e-05, "1": 0}, "score": 4.636952950828924}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5389548380435525, "4": 0.4609925023502813, "3": 4.64330995813999e-05, "2": 5.903306147587471e-06, "1": 0}, "score": 4.538896772503349}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9622649629289766, "2": 0.016299994640062432, "3": 0.014841314010215866, "5": 0.006585793170101935, "1": 5.820697255769273e-06}, "score": 3.9591269413597305}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9678023194544403, "3": 0.018288603000591017, "5": 0.011267281450923098, "2": 0.00263472306811896, "1": 4.559251922405752e-06}, "score": 3.9876955236276532}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6887443788001538, "2": 0.15855795592115257, "3": 0.14895141500533401, "5": 0.003614199089222475, "1": 0.00012367109203693027}, "score": 3.5371719804240422}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5923113223368635, "5": 0.4070892215486299, "3": 0.000548623798488358, "2": 4.945991571385165e-05, "1": 4.84887951759425e-07}, "score": 4.406440583975898}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.802142913986638, "2": 0.16296521595455535, "3": 0.032089753673624745, "5": 0.0027604998792010054, "1": 3.699071954091377e-05}, "score": 3.644627698261468}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9056065443721293, "3": 0.059731222819287985, "2": 0.03350617931490176, "5": 0.001146518866576661, "1": 7.2571309005392265e-06}, "score": 3.8743808799277146}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.4999779757650538, "5": 0.4999779757650538, "3": 3.5710456960864935e-05, "2": 7.6031950325132106e-06, "1": 0}, "score": 4.499927426273649}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6075118061284343, "5": 0.39223911418154406, "3": 0.00019752735043417508, "2": 5.07292190879559e-05, "1": 0}, "score": 4.391940451007153}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5078070634006545, "4": 0.49218348254975025, "3": 7.141926500570792e-06, "2": 1.9832413624976063e-06, "1": 0}, "score": 4.5077961219962965}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.968622778846644, "5": 0.030178362044338564, "3": 0.00100087566215057, "2": 0.0001970841033051759, "1": 3.3055095964318694e-07}, "score": 4.028782342893882}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9756282163603766, "1": 0.01902172180379953, "3": 0.005119627993960448, "4": 0.00022848317105321188, "5": 0}, "score": 1.9865548463051985}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8438302332981198, "5": 0.1466356999111382, "3": 0.007532306319014901, "2": 0.0019958624825188146, "1": 4.795037639118174e-06}, "score": 4.135097432520093}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9261616792080147, "3": 0.033212419223850945, "2": 0.022826539655263937, "5": 0.01777732695833003, "1": 1.925081808906988e-05}, "score": 3.938853905730614}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6651017450196798, "5": 0.3344341766811805, "3": 0.0003621541891302309, "2": 0.00010056663654367293, "1": 2.571927585286779e-07}, "score": 4.33387048499194}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7421302812706835, "5": 0.2564733803676333, "3": 0.0008826290037088476, "2": 0.0005108264773942546, "1": 1.9307442647099238e-06}, "score": 4.254563548555542}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt4", "target_model": "human", "scores": {"5": 0.6074972503199387, "4": 0.392229716244956, "3": 0.00018847748522257503, "2": 8.363637707836415e-05, "1": 3.753968889957593e-07}, "score": 4.607140704281242}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.957128091086934, "5": 0.03828994308168675, "3": 0.0029991001059372995, "2": 0.001580414696882828, "1": 8.211434638057307e-07}, "score": 4.032127602515893}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9223787426397194, "5": 0.0647611559875015, "3": 0.007856417226976796, "2": 0.00499384262717968, "1": 6.943712389685985e-06}, "score": 4.046896358265555}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6150670455272953, "4": 0.38489912192572046, "3": 2.6645267576176273e-05, "2": 6.4284699688316625e-06, "1": 0}, "score": 4.61502801000884}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7602507392862096, "5": 0.23922350420654034, "3": 0.0004406621834440839, "2": 8.410184946220537e-05, "1": 0}, "score": 4.2386148751433135}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5926407093693931, "5": 0.4073156057246603, "3": 3.976426155311819e-05, "2": 3.816060309983917e-06, "1": 0}, "score": 4.407268251936264}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9867192389815945, "5": 0.010297340715939395, "3": 0.002445832801354936, "2": 0.0005372781646950034, "1": 1.1278922787552918e-07}, "score": 4.006776614549436}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9719545469618698, "5": 0.02358377743825754, "3": 0.003560618547190605, "2": 0.0009002653542865563, "1": 4.826032255911737e-07}, "score": 4.018221186004897}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5621636383664951, "4": 0.4378134817740964, "3": 1.8097947932768338e-05, "2": 4.575877840216494e-06, "1": 0}, "score": 4.562136504481909}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7184143839445924, "5": 0.28133512629165347, "3": 0.00023726485717268943, "2": 1.317804329602965e-05, "1": 0}, "score": 4.281071518519823}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9113093021240505, "5": 0.08476497094529416, "3": 0.002442463787879059, "2": 0.0014814291725865033, "1": 8.721991989175884e-07}, "score": 4.079357108538011}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8986931827732719, "5": 0.1008305695476288, "3": 0.0004185607990885155, "2": 5.66460669548094e-05, "1": 0}, "score": 4.1002988210069535}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8795912922683287, "5": 0.1190397509563617, "3": 0.0010625878268682686, "2": 0.0003044365094830044, "1": 8.685653581829838e-07}, "score": 4.117365809276839}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.724650398060218, "5": 0.2750462537511799, "3": 0.00021452892075288384, "2": 8.80424916822402e-05, "1": 2.5514316958213287e-07}, "score": 4.2746550176866736}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.47522053427934463, "4": 0.3266139456101151, "3": 0.19810137190224927, "1": 3.8461531423216796e-05, "5": 2.1914720017797623e-05}, "score": 2.851359757043377}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9833986724151228, "3": 0.006033119934357467, "2": 0.005324209654991842, "5": 0.005241665435209263, "1": 1.4807068246090222e-06}, "score": 3.9885556743215056}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7247686054267853, "5": 0.27509111745370224, "3": 0.00011306722552431588, "2": 2.6855820019386398e-05, "1": 0}, "score": 4.274924435931726}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.711707212886108, "5": 0.2875557282895295, "3": 0.0005817533484357412, "2": 0.0001541492914715187, "1": 2.667473183129229e-07}, "score": 4.28666513108681}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8311381187962269, "4": 0.16885594905342047, "3": 4.039724747981631e-06, "2": 1.710527081754817e-06, "1": 0}, "score": 4.831130809198782}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6076529718200535, "4": 0.3923302576050545, "3": 1.3236571382721987e-05, "2": 3.452965952056181e-06, "1": 0}, "score": 4.60763287855785}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8927424853152688, "5": 0.10662287532295169, "3": 0.0004785705107682502, "2": 0.00015536909712585812, "1": 0}, "score": 4.105833640675433}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9046447715153768, "4": 0.09534885074724586, "3": 3.7026454770614396e-06, "2": 2.0130934281282693e-06, "1": 0}, "score": 4.904637641551779}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.736967857767212, "4": 0.2627739558058884, "2": 0.00015714588189431593, "3": 9.988799996452836e-05, "1": 0}, "score": 4.736554526915726}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9539647098400325, "4": 0.04603383082907279, "3": 8.849329124084785e-07, "2": 3.926865994834782e-07, "1": 0}, "score": 4.953963212879896}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9196356444724115, "4": 0.08035686915787571, "3": 4.909188032480026e-06, "2": 2.046454038201186e-06, "1": 0}, "score": 4.919627130447842}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt4", "target_model": "human", "scores": {"4": 0.4976477905832552, "2": 0.25817629847497925, "3": 0.2425341872962264, "1": 0.0014648717251078817, "5": 0.00015929734625109402}, "score": 3.236864501406023}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8807908957227387, "4": 0.11920208892092925, "3": 5.583554372725906e-06, "2": 1.1522315703070796e-06, "1": 0}, "score": 4.880783253946142}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6224438036371622, "4": 0.3775312621800266, "3": 1.972789369679261e-05, "2": 3.884652596085694e-06, "1": 0}, "score": 4.622417129047481}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8438916157417423, "4": 0.1561042384005623, "3": 3.000876936032988e-06, "2": 6.1926595739687e-07, "1": 0}, "score": 4.843887819977209}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.830932454184576, "5": 0.16881416237734423, "3": 0.00021040927402637575, "2": 4.2084502360473606e-05, "1": 0}, "score": 4.168519734024149}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9712566048141041, "3": 0.012614415899779132, "2": 0.011485556379505947, "5": 0.004640584271914904, "1": 1.3738218919063418e-06}, "score": 3.9690508888127933}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.944258909408634, "5": 0.05496245297823878, "3": 0.0004755183907835716, "2": 0.0003022578792975681, "1": 2.799639477788094e-07}, "score": 4.053881610262659}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9038906077845844, "5": 0.09526936295673867, "3": 0.0006940809233531207, "2": 0.00014548726513916255, "1": 1.9915707539121484e-07}, "score": 4.094283734726027}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6653682581147929, "4": 0.3345681443941851, "3": 4.678658693838862e-05, "2": 1.616901179054577e-05, "1": 1.5851541386464655e-07}, "score": 4.665288979543343}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5467034513723774, "5": 0.4532330801974234, "3": 5.172998313337682e-05, "2": 1.1542519421025943e-05, "1": 0}, "score": 4.4531583539616975}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8973137958047344, "3": 0.05918426300789082, "2": 0.03821223219876551, "5": 0.005252899863069631, "1": 3.4304809327213715e-05}, "score": 3.8695409313189053}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8985500413369903, "5": 0.1008145085171949, "3": 0.0005048002759930497, "2": 0.00012964339397955832, "1": 3.066379810502841e-07}, "score": 4.100049571557777}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9374343127428155, "5": 0.0580843740803824, "3": 0.0031760766555819202, "2": 0.0013034592331415042, "1": 1.0822330635956932e-06}, "score": 4.052298168609431}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5698080951595674, "5": 0.43011371576036234, "3": 6.205707697730644e-05, "2": 1.5690486259766197e-05, "1": 0}, "score": 4.430020467572141}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.592072757776753, "2": 0.27967535357910256, "3": 0.12804470733378537, "5": 0.00013865787358893203, "1": 6.549734175760321e-05}, "score": 3.312544671051183}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8998188488254615, "5": 0.08239861091800554, "3": 0.013451203464804147, "2": 0.004299262855206495, "1": 2.76416462615756e-05}, "score": 4.060266223921402}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6924549480530806, "5": 0.30727502055088846, "3": 0.00022514588231809242, "2": 4.364652017208896e-05, "1": 2.5953169579688474e-07}, "score": 4.306962103690807}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9509674701147172, "3": 0.026558636295181327, "2": 0.01610862719318422, "5": 0.0063082290468898326, "1": 5.543629690257992e-05}, "score": 3.947365945204714}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8665400244089948, "5": 0.1328882140552806, "3": 0.00048681713412855116, "2": 8.199338374433579e-05, "1": 1.367369140135821e-06}, "score": 4.132233517457683}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.918840665303897, "5": 0.08028739854863667, "3": 0.0007749071052412917, "2": 9.548732899128338e-05, "1": 8.391368776362062e-07}, "score": 4.079319055102473}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9730321268460124, "5": 0.025132629424783948, "3": 0.0009744980890236072, "2": 0.0008599915451379407, "1": 3.4799142440149786e-07}, "score": 4.0224371133830035}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9913227168348665, "5": 0.006081736592623562, "3": 0.0019438397684067223, "2": 0.0006511047645858743, "1": 0}, "score": 4.002835689002242}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt4", "target_model": "gpt35", "scores": {"2": 0.5178664751146508, "4": 0.3240725397926894, "3": 0.1579403419266823, "5": 9.445254678571825e-05, "1": 2.042679578812109e-05}, "score": 2.806353000032923}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9848241216044039, "5": 0.01495376756287806, "3": 0.0001314128058054335, "2": 9.031861252591448e-05, "1": 0}, "score": 4.014641723087301}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.991491802333986, "5": 0.0071114835507923345, "3": 0.0009041236734640982, "2": 0.0004915635149358816, "1": 0}, "score": 4.005224238212366}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9474198970229137, "5": 0.05180530095054279, "3": 0.0005577983727719733, "2": 0.0002150504298282901, "1": 8.002129157509595e-07}, "score": 4.0508150596696915}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9693305891514848, "5": 0.028370664721465502, "3": 0.0020233020985256115, "2": 0.00027382399828274827, "1": 7.691152566983473e-07}, "score": 4.025797429232023}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9385184632504185, "5": 0.05462832816044766, "3": 0.006323687979228852, "2": 0.0005272542383717272, "1": 1.0178398199562987e-06}, "score": 4.047247137174564}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8477579247840241, "5": 0.15199461293211525, "3": 0.0002249719117993286, "2": 2.125517846099227e-05, "1": 0}, "score": 4.151727318076007}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7368658389988847, "5": 0.26273759040694855, "3": 0.0003378700175183366, "2": 5.7802761882111483e-05, "1": 0}, "score": 4.26228435034843}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9697132827231569, "5": 0.022805471357276466, "2": 0.004088794891089315, "3": 0.0033897300229803005, "1": 1.788953045516232e-06}, "score": 4.011232795162536}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9905407666924263, "2": 0.003923566175865707, "3": 0.003923566175865707, "5": 0.001610228314164173, "1": 8.631917331753321e-07}, "score": 3.989836929952257}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9428314975132581, "2": 0.030307268825683367, "3": 0.022877126737752683, "5": 0.00397544733540052, "1": 7.322988853562843e-06}, "score": 3.9204617076689146}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9847262127954236, "5": 0.014952272260888109, "3": 0.0002825539647378901, "2": 3.884170567823005e-05, "1": 0}, "score": 4.014592036625235}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8691618434789308, "5": 0.12718647021088944, "3": 0.0035520655486878726, "2": 7.488170172686138e-05, "1": 0}, "score": 4.123487696228246}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9213250531292297, "5": 0.07562697101216408, "3": 0.0027120035497499393, "2": 0.0003341842735205887, "1": 9.684509506873137e-07}, "score": 4.072243752772373}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.9201115649879164, "4": 0.051909145004854364, "3": 0.027784963108497755, "1": 0.00018145352457440864, "5": 6.6094441494781905e-06}, "score": 2.1314424512723953}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5167420836678066, "2": 0.4283942339498244, "3": 0.05361983089213392, "5": 0.0011662502400174473, "1": 7.455585365377738e-05}, "score": 3.0905315141950713}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5466157726373959, "4": 0.4531603919730785, "3": 0.0001862566493749256, "2": 3.7253673520542476e-05, "1": 1.0965957967079169e-07}, "score": 4.546354797350917}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9334308078107684, "2": 0.038527292220009085, "3": 0.02731994110578072, "5": 0.0007167641582465049, "1": 3.3715465565954804e-06}, "score": 3.89633193496945}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7651167518522757, "5": 0.23334741136627443, "3": 0.0010473658303042992, "2": 0.00048707034486738436, "1": 3.9196158476756336e-07}, "score": 4.231324962286176}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8482097475209136, "5": 0.14739675712171824, "3": 0.002829224593783555, "2": 0.0015624462139784442, "1": 9.946479315910967e-07}, "score": 4.141439773537288}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9171112395120218, "5": 0.07767076090181074, "3": 0.0037480244168226744, "2": 0.0014677474505497875, "1": 7.746132224308692e-07}, "score": 4.07098502089295}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8932965467539459, "4": 0.10668906601622481, "3": 1.1439228649829978e-05, "2": 2.6334599658977814e-06, "1": 0}, "score": 4.893280121578778}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6586549091384897, "2": 0.26612062381487195, "3": 0.07506276865982225, "5": 9.355781224176972e-05, "1": 3.606974978503906e-05}, "score": 3.392661854438067}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9428204721061918, "3": 0.03655711671410505, "2": 0.01205525758614418, "5": 0.008548457685210186, "1": 1.3896410341396393e-05}, "score": 3.947838886220631}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8703586333781774, "5": 0.1293672526052527, "3": 0.00023460671475744696, "2": 3.890160688870901e-05, "1": 1.092667168533817e-07}, "score": 4.129054578942901}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9560394797249537, "3": 0.02932452741508718, "2": 0.01222428172437103, "5": 0.0024071037925139137, "1": 2.907895308920585e-06}, "score": 3.948625201933972}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6370219535704486, "4": 0.36296418989883183, "3": 1.0977070069258726e-05, "2": 2.1280020992408537e-06, "1": 0}, "score": 4.637007199180688}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9868263679708987, "2": 0.00559917339596242, "3": 0.004226477817675712, "5": 0.0033434191433459543, "1": 2.7329307221111976e-06}, "score": 3.9879103736327792}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9480980374902329, "2": 0.02647849724738754, "5": 0.012904586347327864, "3": 0.012507553964999855, "1": 8.74483777732714e-06}, "score": 3.94741366769558}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5544031218942022, "5": 0.44547542336567936, "3": 0.00010763787220487461, "2": 1.3263588286144116e-05, "1": 0}, "score": 4.445341504715284}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5389407176117742, "4": 0.4609804245049402, "3": 6.75579371561206e-05, "2": 1.0857548560683787e-05, "1": 0}, "score": 4.538851682964172}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6859235092665608, "5": 0.3140386850080131, "3": 3.2635366358555284e-05, "2": 4.486269714799828e-06, "1": 0}, "score": 4.31399729190443}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8072138112639327, "5": 0.19173010480958536, "3": 0.0007476754234738165, "2": 0.00030684525280000704, "1": 7.257632334763931e-07}, "score": 4.19036672102046}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6950712296249201, "2": 0.27219381807197063, "3": 0.03102022090145729, "5": 0.0016699008927052118, "1": 4.246348618083065e-05}, "score": 3.4261332950332086}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5389331724945436, "4": 0.460973970824173, "3": 6.547848123922208e-05, "2": 2.6872314556182913e-05, "1": 1.0982100761363053e-07}, "score": 4.5388138333261905}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7826087488953813, "4": 0.21732259857571434, "3": 5.010588959481386e-05, "2": 1.7588821495669255e-05, "1": 2.3203630278497207e-07}, "score": 4.782523337194856}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5621413546415366, "4": 0.437796127191649, "3": 4.409663862816701e-05, "2": 1.7816652576563246e-05, "1": 0}, "score": 4.562061964675329}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9169138626483019, "5": 0.08266229549168683, "2": 0.00021473282006443704, "3": 0.0002081261857392811, "1": 3.1290506472536514e-07}, "score": 4.082023819902412}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.928782738039456, "5": 0.06941651996186705, "3": 0.0014633821225040922, "2": 0.0003368896935618407, "1": 1.983455748580999e-07}, "score": 4.06727878170438}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9352322133544536, "5": 0.06364335872224712, "3": 0.0009366411749788569, "2": 0.00018734007684375326, "1": 2.6458983565649765e-07}, "score": 4.062331254973451}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9032659560109811, "5": 0.08943544489881675, "3": 0.006378237332310251, "2": 0.0009188722087101066, "1": 7.871374131673622e-07}, "score": 4.081217158784735}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6925826762224292, "5": 0.30733168728919075, "3": 7.904818142102896e-05, "2": 6.388072361192149e-06, "1": 0}, "score": 4.3072399244831105}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9817889581091582, "3": 0.01125290794199481, "5": 0.0044067020665612055, "2": 0.002550403492439502, "1": 3.5112308690837535e-07}, "score": 3.9880519256783926}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5308695799790354, "5": 0.46849076000788387, "3": 0.0005931198923854156, "2": 4.573649504926231e-05, "1": 1.9896955776086653e-07}, "score": 4.467805853078384}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.9872486453116617, "3": 0.012234958181912057, "1": 0.00041865724660695313, "4": 9.48860367152199e-05, "5": 0}, "score": 2.0120061072648383}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9463693241884781, "5": 0.04711695330228187, "3": 0.005044294885295559, "2": 0.0014679735010626152, "1": 6.225156925559914e-07}, "score": 4.039134876412628}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7488077380034651, "5": 0.2508191794653412, "3": 0.00027588595063057417, "2": 9.684507705669878e-05, "1": 1.2260806899379246e-07}, "score": 4.250349292840201}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7928814056852614, "5": 0.20683545607588133, "3": 0.00023108937904612586, "2": 5.156301015516327e-05, "1": 1.0269966314577459e-07}, "score": 4.206501011698396}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt4", "target_model": "human", "scores": {"4": 0.92740663744853, "5": 0.07151391734799331, "3": 0.0007821312442338552, "2": 0.0002968635358515436, "1": 1.0436588363595235e-07}, "score": 4.070137770206107}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7248149341166934, "4": 0.2751087238486179, "3": 6.244564872257052e-05, "2": 1.3717488587226916e-05, "1": 0}, "score": 4.724725183142232}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7547689221179603, "5": 0.24503757814874277, "3": 0.00016866551591610186, "2": 2.4298571387108042e-05, "1": 0}, "score": 4.244820446627143}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8871956198564858, "4": 0.11279427440808754, "3": 7.2215568363547375e-06, "2": 2.828002290482819e-06, "1": 0}, "score": 4.887182792133716}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6859071776222342, "5": 0.3140311795731317, "3": 3.8153693107663743e-05, "2": 2.3141384651064646e-05, "1": 0}, "score": 4.313946852278479}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt4", "target_model": "human", "scores": {"5": 0.9343859999038808, "4": 0.06560419742118577, "3": 9.174203314507886e-06, "2": 5.864871961719766e-07, "1": 0}, "score": 4.934375691955398}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5155142823960503, "4": 0.4842808509497647, "3": 0.00017842539487407898, "2": 2.5704615262181504e-05, "1": 0}, "score": 4.515284827352153}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8829151375161312, "5": 0.1158132498810179, "3": 0.0008842453399075058, "2": 0.0003862981798715023, "1": 0}, "score": 4.114156530224182}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9098565802617872, "4": 0.09008799176482322, "3": 4.829328663646616e-05, "2": 6.638709272786496e-06, "1": 0}, "score": 4.9097954607946654}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9688507700767244, "4": 0.031143659556643263, "3": 3.55459295699548e-06, "2": 1.6790708214934446e-06, "1": 0}, "score": 4.968844183554726}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6791622809860032, "5": 0.32081353900481185, "3": 2.152554905917913e-05, "2": 2.415099671183009e-06, "1": 0}, "score": 4.320787260040195}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9971101474858776, "3": 0.0012822435011822493, "2": 0.0008150435586135586, "5": 0.0007899673045541291, "1": 1.2642657994136763e-06}, "score": 3.997873841052698}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9045142633057288, "5": 0.09533509290073552, "3": 0.00012069643093696616, "2": 2.9577932450423306e-05, "1": 0}, "score": 4.095155275758125}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5926449823243116, "5": 0.4073185424807646, "3": 3.0015849474353455e-05, "2": 6.098089698569991e-06, "1": 0}, "score": 4.4072764775828634}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9966969278850223, "5": 0.0029338667972565674, "3": 0.00031409722067321576, "2": 5.373569854187002e-05, "1": 4.79662550533785e-07}, "score": 4.002510861433384}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9029411439854831, "2": 0.08140260532794731, "3": 0.01414565173497762, "5": 0.001490940723788832, "1": 1.847720957824727e-05}, "score": 3.8244844394171054}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9547270909307034, "3": 0.02708352417509988, "2": 0.017215330224596457, "5": 0.0007803991799680648, "1": 0.00016877324323630124}, "score": 3.938758370996664}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9849686694311844, "5": 0.012398927525383983, "3": 0.0020240692777607986, "2": 0.0006077358060235294, "1": 3.257876656991092e-07}, "score": 4.009158411765242}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7825597043419152, "5": 0.21730899460685218, "3": 0.00011290825180224282, "2": 1.8146007389358238e-05, "1": 0}, "score": 4.217159847933594}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.982560823779679, "5": 0.011619239235133123, "3": 0.0038919576344809918, "2": 0.0019266587383840639, "1": 8.973292368813298e-07}, "score": 4.003871273774818}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9531857724118792, "3": 0.03261622222873754, "2": 0.011629672183431883, "5": 0.0025546999464793178, "1": 1.2593622788873083e-05}, "score": 3.9466412970104474}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.886720719402899, "5": 0.11273388924371275, "3": 0.0005302826455913503, "2": 1.4809747190786211e-05, "1": 7.18740899122137e-08}, "score": 4.112173796954628}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9051056878011422, "5": 0.09246236334682742, "3": 0.0021745054926342873, "2": 0.0002556812516554495, "1": 5.506293170578658e-07}, "score": 4.089774952223349}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5774649679411167, "4": 0.42248239571489243, "3": 4.822017770121385e-05, "2": 4.020485063702216e-06, "1": 0}, "score": 4.577408935263164}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9654957664014318, "2": 0.016612276645488335, "3": 0.015125650011828685, "5": 0.0027545855039034237, "1": 1.0911012038018141e-05}, "score": 3.9543716121865837}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9782952626120673, "3": 0.008732587161991297, "5": 0.007239569034339129, "2": 0.005726970480657853, "1": 4.329454523424359e-06}, "score": 3.987040035942425}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9776738473348064, "5": 0.016051483560529347, "3": 0.005050823397378843, "2": 0.0012185678539386494, "1": 3.7008279243779e-06}, "score": 4.008552435458909}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9541751041972854, "2": 0.01949625077201718, "5": 0.018315034482623605, "3": 0.008001245995439873, "1": 1.0451312388736464e-05}, "score": 3.9712898780766226}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8174875873465064, "5": 0.1824061289877342, "3": 8.363738072091092e-05, "2": 2.216169965042526e-05, "1": 0}, "score": 4.182278256537091}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9832655351484668, "5": 0.013808084845464499, "3": 0.0025146390616099263, "2": 0.00041050354224925347, "1": 3.4619937483409396e-07}, "score": 4.010471409433381}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt4", "target_model": "human", "scores": {"5": 0.7431121377598137, "4": 0.25681266239248457, "3": 5.391197144391871e-05, "2": 2.0784916553789814e-05, "1": 3.011498064981416e-07}, "score": 4.743015902453807}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9416485002742055, "4": 0.0583454909007958, "3": 4.872039110413112e-06, "2": 1.0212348761880931e-06, "1": 0}, "score": 4.941641694572994}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9867730847328876, "4": 0.013222769147045912, "3": 3.0486399037483277e-06, "2": 8.334517707141741e-07, "1": 0}, "score": 4.986768629724377}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9073088396914479, "4": 0.0926874313263724, "3": 3.078641899324386e-06, "2": 5.104888708852445e-07, "1": 0}, "score": 4.907304866959671}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9539636223208832, "4": 0.046033789398643686, "3": 1.6024048914853788e-06, "2": 8.988676791637264e-07, "1": 0}, "score": 4.953960305182719}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt4", "target_model": "human", "scores": {"4": 0.961113496007907, "5": 0.03726641351242316, "3": 0.0012751862915822815, "2": 0.0003432117343288795, "1": 4.923691977174868e-07}, "score": 4.0353033690116185}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7662826979120606, "4": 0.23370302349866093, "3": 1.1472255531401468e-05, "2": 2.1555729493018984e-06, "1": 0}, "score": 4.766267413167423}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6921617970001981, "5": 0.30714494784552204, "3": 0.0005837366024964998, "2": 0.00010798048949325246, "1": 0}, "score": 4.306345721442841}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7879153726545222, "4": 0.21206454353691345, "3": 1.6635210409025593e-05, "2": 3.0772045092141144e-06, "1": 0}, "score": 4.787892875653503}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9281036227347815, "5": 0.07156765878546183, "3": 0.0002462934122620477, "2": 8.121894704687666e-05, "1": 0}, "score": 4.071159013305447}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9748941499808558, "5": 0.02292731235135891, "3": 0.0017958058792389572, "2": 0.00038234913530652703, "1": 0}, "score": 4.020366815994935}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9624768221435165, "5": 0.03731927984302019, "3": 0.00018980847889482947, "2": 1.3749680094182295e-05, "1": 0}, "score": 4.037101984613212}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6441062706205305, "5": 0.3557092483300906, "3": 0.00016827819928607048, "2": 1.4703985183535723e-05, "1": 0}, "score": 4.355512095025041}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5926594667446785, "5": 0.40732849746759225, "3": 9.744963212740725e-06, "2": 1.2008150780925575e-06, "1": 0}, "score": 4.407316794853376}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9872599148192684, "5": 0.012045405235731436, "3": 0.000658647544747356, "2": 3.436585753397075e-05, "1": 0}, "score": 4.011318044837922}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8956109839364051, "5": 0.10367450991385017, "3": 0.0006261791786150343, "2": 8.74341604355559e-05, "1": 3.5732342961411485e-07}, "score": 4.10287244553096}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5543113203385951, "4": 0.44540165874344934, "3": 0.0002622325113110542, "2": 2.4013269129561253e-05, "1": 2.7096423471435206e-07}, "score": 4.554000527708584}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.904343918609096, "5": 0.09531714299277923, "3": 0.00027194220387506793, "2": 6.66423031252409e-05, "1": 1.1353314684203613e-07}, "score": 4.0949115983959725}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5467228924927693, "4": 0.4532491974523183, "3": 1.787802952194097e-05, "2": 9.873185607578713e-06, "1": 0}, "score": 4.546685354927415}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9281578394914242, "5": 0.07157184561596439, "3": 0.00020741198021981722, "2": 6.227636986678454e-05, "1": 0}, "score": 4.071239925530854}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.895590913519145, "5": 0.10048251969442284, "3": 0.0020531162871540607, "2": 0.001869383652571878, "1": 2.519321345630871e-06}, "score": 4.094683224662779}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.7882070577487748, "4": 0.14580365370740472, "3": 0.06571885554959982, "1": 0.00018459081377488737, "5": 7.816066828881397e-05}, "score": 2.357378799365093}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.83771845291004, "2": 0.1367537795049745, "3": 0.021302130239998832, "5": 0.004194638989903805, "1": 2.8708322346614946e-05}, "score": 3.709298159056184}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6925275696113278, "5": 0.30730725539123205, "2": 8.413970381105313e-05, "3": 8.028666624918001e-05, "1": 0}, "score": 4.307058919190076}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.946959995583851, "5": 0.047146363456156214, "2": 0.004250375274762096, "3": 0.0016386656440512493, "1": 3.2637817137943962e-06}, "score": 4.036997205355305}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8808455416850095, "5": 0.04524681491194049, "2": 0.03810163821518406, "3": 0.03579317665393703, "1": 1.182111758638915e-05}, "score": 3.9332148311944057}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9793693645669583, "5": 0.014189948743119112, "3": 0.004194540836499841, "2": 0.0022451759201261453, "1": 4.787458331943149e-07}, "score": 4.005503622532178}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.976077316481643, "2": 0.008989362905758025, "5": 0.008849995751667361, "3": 0.006082507197466628, "1": 0}, "score": 3.9847887503050017}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7538596868517091, "5": 0.24474241227324844, "2": 0.0007204215724578337, "3": 0.000676773435899514, "1": 3.627964150840419e-07}, "score": 4.242623790540197}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9837408278042128, "5": 0.009644256713804696, "2": 0.003332965935769304, "3": 0.0032812930884252764, "1": 4.4474355579729425e-07}, "score": 3.9996956974587485}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9033294740996822, "5": 0.09228090856350787, "3": 0.0035226455322455957, "2": 0.0008632614137029484, "1": 2.041822023405407e-06}, "score": 4.087025759946257}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9587039967319807, "5": 0.03957043620565497, "3": 0.001607945502949889, "2": 0.00011647918155800722, "1": 4.008522225019303e-07}, "score": 4.037728357759467}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9049950417739833, "5": 0.055205046929295634, "3": 0.030487122428068038, "2": 0.009298046078340566, "1": 1.292850492822681e-05}, "score": 4.006083057866165}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9720960096884759, "5": 0.026727806862236896, "3": 0.000928977536262352, "2": 0.0002461547880973082, "1": 0}, "score": 4.025306546350122}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8201293477542073, "2": 0.13388243699149058, "3": 0.04484499907673879, "5": 0.0011226728090961108, "1": 1.5280714726887005e-05}, "score": 3.688465318106037}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt4", "target_model": "human", "scores": {"4": 0.650385262589818, "5": 0.3481261725916172, "3": 0.0012753105007759706, "2": 0.0002114673383517906, "1": 9.34443193519116e-07}, "score": 4.346425419424782}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6223773488599993, "5": 0.37749094399425515, "3": 0.00011351404320706188, "2": 1.768207753539805e-05, "1": 0}, "score": 4.377342258627307}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6925454439785672, "4": 0.30731515328918313, "3": 0.00012242572970119336, "2": 1.6311649698539292e-05, "1": 1.4789607585532571e-07}, "score": 4.692390309543298}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7431484173799575, "4": 0.25682522083872705, "3": 2.3924440654997832e-05, "2": 2.3321149458908842e-06, "1": 0}, "score": 4.743119906904733}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9262950245986945, "4": 0.07369558401259535, "3": 8.280866046904581e-06, "2": 9.43718419240029e-07, "1": 0}, "score": 4.92628501080408}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9895515191040467, "5": 0.008561299410987384, "3": 0.0010386034549647889, "2": 0.0008476834347050796, "1": 0}, "score": 4.005827334299719}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9238372585158582, "5": 0.07583318388563974, "3": 0.00021299965755055826, "2": 0.00011580590511973707, "1": 2.2009204317974717e-07}, "score": 4.075387952243873}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7548342728402292, "5": 0.24505882382775512, "3": 9.762450697590182e-05, "2": 8.939713645469097e-06, "1": 0}, "score": 4.244943402956588}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5389804551757911, "5": 0.46101441384464054, "3": 4.319154035501024e-06, "2": 5.491188139497819e-07, "1": 0}, "score": 4.46100911756317}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9903685048416987, "5": 0.006993295322446754, "3": 0.0017137807228220156, "2": 0.0009173207178660197, "1": 4.314936282716077e-06}, "score": 4.003431937907703}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9717022360171466, "5": 0.02756507241170972, "3": 0.0006584769771227274, "2": 7.387906931240553e-05, "1": 0}, "score": 4.026758846274216}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6583893930107735, "5": 0.34156793109571887, "3": 3.6623003648625874e-05, "2": 5.443523524817482e-06, "1": 0}, "score": 4.341520629156194}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9190214613142956, "5": 0.08030320869386864, "3": 0.0006227776530940878, "2": 5.1925736727620365e-05, "1": 0}, "score": 4.079576629430195}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7606404524366471, "4": 0.2393461376745882, "3": 1.138777666698007e-05, "2": 1.0928517432613024e-06, "1": 0}, "score": 4.760627585777554}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9631245116069072, "5": 0.032956307827904555, "3": 0.0032125270775081806, "2": 0.0007056985462294977, "1": 0}, "score": 4.02833241071373}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9579169699171292, "5": 0.034892118717132325, "3": 0.003677603359387102, "2": 0.003509193640317853, "1": 2.1316387667466115e-06}, "score": 4.024189781122548}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9742254626179164, "5": 0.02401113494948651, "2": 0.001158664071542547, "3": 0.0005917877013391096, "1": 5.200592482110645e-06}, "score": 4.021086580750034}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8696567981919144, "2": 0.06918947661224696, "3": 0.057360090783214523, "5": 0.003783308074835709, "1": 7.654001308533798e-06}, "score": 3.8080207890301527}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7662849584493537, "4": 0.23370372460878308, "3": 7.523711433991573e-06, "2": 3.286866101135881e-06, "1": 0}, "score": 4.766271249018144}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7771987576303567, "5": 0.2226711632680308, "3": 9.895859773486417e-05, "2": 3.06559434757782e-05, "1": 0}, "score": 4.222510996153141}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9873426575781125, "5": 0.010630925771169185, "3": 0.0016559788414547503, "2": 0.00036949882409620974, "1": 2.927379490387217e-07}, "score": 4.008235076389571}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6625854157489947, "2": 0.2325893562111131, "3": 0.10003543557632213, "5": 0.004534769607059752, "1": 0.00024796300408596976}, "score": 3.438572769002856}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9639258966705465, "5": 0.032983732289007944, "3": 0.0020120201739113634, "2": 0.0010769567924968234, "1": 3.906354753184806e-07}, "score": 4.028816655539421}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9499084637283979, "5": 0.04879440130799009, "3": 0.0009969951027504564, "2": 0.000299352125570035, "1": 1.8470331534695755e-07}, "score": 4.047198176306163}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9016429318390425, "5": 0.09804912994147591, "3": 0.0002711300399399163, "2": 3.6124581369007536e-05, "1": 0}, "score": 4.097705817530316}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9613505358218303, "2": 0.019952197327142776, "3": 0.0128821029386368, "5": 0.00580641870537948, "1": 7.948391315700149e-06}, "score": 3.9529960384850154}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8801753059878512, "5": 0.11545386107988254, "2": 0.0031251937428610987, "3": 0.0012431161842313587, "1": 9.397668728948421e-07}, "score": 4.10795770903209}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9710782741935263, "5": 0.027547373050458034, "3": 0.0007456729937812508, "2": 0.0006279196158045755, "1": 0}, "score": 4.025545880243677}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9282119665940297, "5": 0.07157603269140367, "3": 0.00016154206254783012, "2": 5.0043396448433965e-05, "1": 0}, "score": 4.0713144334496745}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9815218830471506, "5": 0.01742409953996398, "3": 0.0005962198995327333, "2": 0.0004571376540784189, "1": 1.8497854343997315e-07}, "score": 4.0159130569534485}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8467721574378425, "5": 0.15181787004008473, "2": 0.0009027420538549761, "3": 0.0005063923975418806, "1": 5.071550812243977e-07}, "score": 4.149504521542967}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9844100246542213, "5": 0.009501194988720088, "2": 0.004216129718800375, "3": 0.0018708962216705662, "1": 1.4592499312146207e-06}, "score": 3.9991936613416508}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6854709079834682, "5": 0.31383145647534116, "3": 0.0005181999947331524, "2": 0.00017908517989076027, "1": 1.607727435267297e-07}, "score": 4.312954663136867}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9928889219216274, "2": 0.0029686846590698756, "5": 0.002422969802697167, "3": 0.0017181428669516845, "1": 9.502782504753986e-07}, "score": 3.9947646050527066}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9734274167643838, "5": 0.023619515044167712, "3": 0.00179310378965981, "2": 0.0011577148195261254, "1": 1.6350993351780733e-06}, "score": 4.019506088303609}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9601158670111554, "3": 0.019926567248678844, "2": 0.01871927757044009, "5": 0.0012346701865412933, "1": 2.7433630491256806e-06}, "score": 3.9438612686077694}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9548774952068058, "5": 0.04328616976325475, "3": 0.0010022107190259368, "2": 0.0008308618686250173, "1": 1.7342734379939027e-06}, "score": 4.040617094556443}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9215388161227849, "5": 0.07804573328084283, "3": 0.00029963035291127925, "2": 0.00011551779160444763, "1": 0}, "score": 4.077515090789306}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5311779242222665, "5": 0.46876287284746515, "3": 4.721575163333568e-05, "2": 1.1570717556148063e-05, "1": 0}, "score": 4.4686927108529915}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9037797930699749, "5": 0.09525768364879637, "3": 0.0005664228918498007, "2": 0.000395426906789311, "1": 0}, "score": 4.0939004701837005}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6779001589982213, "2": 0.2738964126766115, "3": 0.04759605972774526, "5": 0.0005898570727428915, "1": 1.6218143066775904e-05}, "score": 3.405151548196524}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7548912574303422, "5": 0.24507730195968858, "3": 2.6277276596185174e-05, "2": 4.860807410513778e-06, "1": 0}, "score": 4.245041377199651}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7658292464136983, "5": 0.23356471225291786, "3": 0.0005189666162940803, "2": 8.605310089401429e-05, "1": 0}, "score": 4.23287387734256}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9145508632992104, "5": 0.08506649790984637, "3": 0.0002837414845543864, "2": 9.805843318445839e-05, "1": 0}, "score": 4.084586710516448}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5155992306826331, "5": 0.4843606524798442, "3": 3.353063699176078e-05, "2": 6.20254417051955e-06, "1": 0}, "score": 4.484314902565004}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9334314332096192, "3": 0.03507952331789238, "2": 0.021276806420405973, "5": 0.010208723286714995, "1": 2.4666786212038773e-06}, "score": 3.932568116485115}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8595498130432835, "3": 0.07995059480640139, "2": 0.06034987516244842, "5": 0.00010443235674777907, "1": 3.841851704058967e-05}, "score": 3.799337453902395}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9268826060508215, "5": 0.05925362022438348, "3": 0.011133429833784072, "2": 0.0027283643187193504, "1": 7.828662287965762e-07}, "score": 4.042661164207348}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6076329378318347, "4": 0.392317310920175, "3": 4.692621891577899e-05, "2": 2.647396112737383e-06, "1": 0}, "score": 4.607580824747075}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8277788248715953, "3": 0.09001677834243398, "2": 0.081961209378836, "5": 0.00023383729616142669, "1": 6.231552866276045e-06}, "score": 3.7462751542817823}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6306995555537702, "2": 0.3375891349443291, "3": 0.02904088541479938, "5": 0.002618115224627999, "1": 5.1045100116866664e-05}, "score": 3.2982449377691885}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9885771913919522, "5": 0.006980648906372251, "3": 0.0041037117907709204, "2": 0.00033685317669830824, "1": 8.092855625767198e-07}, "score": 4.0022008046341355}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9092057161617773, "5": 0.09002356586340733, "3": 0.0007431898705983543, "2": 2.7070689057701126e-05, "1": 0}, "score": 4.089226275428143}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7488986637590044, "5": 0.25084960567712283, "3": 0.00023234760737269323, "2": 1.9072253031453703e-05, "1": 7.554578051643371e-08}, "score": 4.2505789458519105}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9060321390529068, "5": 0.09255700999900664, "3": 0.0012997861864541339, "2": 0.00011007974503071404, "1": 3.614813092513578e-07}, "score": 4.091036036642745}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9886512929724403, "3": 0.005269664398266396, "2": 0.0047236966375175035, "5": 0.0013533617455611154, "1": 1.4655367505045427e-06}, "score": 3.9866319005278488}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7487859629910542, "5": 0.2508118807334158, "3": 0.00037708044926707684, "2": 2.3732218562471313e-05, "1": 0}, "score": 4.250387672269829}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9149005482966671, "4": 0.08509899951946015, "3": 3.766064853802587e-07, "2": 3.5029859871067906e-08, "1": 0}, "score": 4.9149001387274005}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9263022904853643, "4": 0.07369616621000873, "3": 1.1383519493445152e-06, "2": 1.218708450630375e-07, "1": 0}, "score": 4.926301170610758}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7879099675736051, "5": 0.21206308029661122, "3": 2.203789690424445e-05, "2": 4.692139012755195e-06, "1": 0}, "score": 4.212031705212622}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5321912988345257, "4": 0.31285911549863604, "3": 0.15011144411168836, "5": 0.0031645259925151856, "1": 0.0016675880132636278}, "score": 2.783660388624925}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.8863321867796804, "3": 0.07162662618868096, "4": 0.04081162139573254, "1": 0.001194486850058883, "5": 2.898335089237212e-05}, "score": 2.1521432595621066}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9549541310204303, "5": 0.034784200636198116, "3": 0.008658472133286601, "2": 0.0016016562962737387, "1": 6.481024832081647e-07}, "score": 4.022920492043668}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6642568114817393, "5": 0.33400928065475144, "3": 0.0014991814797173856, "2": 0.0002335274333911352, "1": 3.9784195838810497e-07}, "score": 4.33204211678412}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9736037905328456, "3": 0.022896967517665144, "2": 0.002163287983709759, "5": 0.0013327630640279143, "1": 2.0352823535931544e-06}, "score": 3.9741030838049034}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9522679763865803, "5": 0.0474106353963069, "3": 0.00027324028091835933, "2": 4.748204112469071e-05, "1": 0}, "score": 4.047042462358484}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7979765563271692, "5": 0.20176006189302234, "3": 0.00022541869913882354, "2": 3.679859105762192e-05, "1": 0}, "score": 4.201461280611337}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.940744580833315, "3": 0.031200111826201457, "5": 0.015445169164012429, "2": 0.012605979677773082, "1": 3.293420063989138e-06}, "score": 3.9590231822739033}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5078087137762923, "4": 0.4921850821486679, "3": 5.391025130176729e-06, "2": 5.771578717364414e-07, "1": 0}, "score": 4.507802288221935}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9643567405661453, "5": 0.03512669135612418, "3": 0.00036089662427106305, "2": 0.00015521970392407444, "1": 1.6291389943897824e-07}, "score": 4.0344548765341015}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.871035626483506, "2": 0.07611023721262258, "3": 0.052309750042473194, "5": 0.0005374378137524275, "1": 5.268857563663185e-06}, "score": 3.795991064121958}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9122259841175518, "5": 0.08754368089097028, "3": 0.00020385186089378718, "2": 2.632498683603526e-05, "1": 0}, "score": 4.087287192860328}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.974776667691702, "5": 0.022924552069124138, "3": 0.0014885958290059, "2": 0.0008093355140468948, "1": 2.5505235477975557e-07}, "score": 4.019816531822884}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.692552951211869, "5": 0.30731850304261005, "3": 9.534620761668637e-05, "2": 3.29507676456111e-05, "1": 0}, "score": 4.307157331711311}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9841713115296937, "3": 0.008382740410394683, "2": 0.0038378982229497595, "5": 0.0036053717243876298, "1": 1.6531466922828409e-06}, "score": 3.9875418626588504}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7717500892142035, "5": 0.22812889062415406, "3": 8.1464436085691e-05, "2": 3.908706359754675e-05, "1": 0}, "score": 4.22796935890144}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5074787707376274, "5": 0.4918652903901097, "3": 0.0005669863095173921, "2": 8.695011452748371e-05, "1": 0}, "score": 4.491125387304694}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7309898897787703, "5": 0.268916138707981, "3": 7.837700321310196e-05, "2": 1.4958512831776761e-05, "1": 0}, "score": 4.268808015640251}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7371495132499228, "4": 0.262838763853894, "3": 9.739322512180942e-06, "2": 1.4030824382739448e-06, "1": 0}, "score": 4.7371373956643295}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6076471201501107, "4": 0.3923264677130713, "3": 1.866638957880495e-05, "2": 7.196534264371757e-06, "1": 0}, "score": 4.607614394401712}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9350672809939721, "5": 0.030057688314290325, "2": 0.02131409261343961, "3": 0.013548058853000368, "1": 1.1605725546830235e-05}, "score": 3.9738465937514134}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9506271379281602, "5": 0.04048258489256547, "3": 0.007606452338285011, "2": 0.0012811356087998995, "1": 1.2830660407000044e-06}, "score": 4.030310054759531}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9659227914491031, "5": 0.015858553043627543, "2": 0.009178226359892492, "3": 0.009035931149343278, "1": 3.488907179040093e-06}, "score": 3.9884556908037054}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5850390393764826, "4": 0.4148547997891004, "3": 0.00010023912264085602, "2": 5.6551043266427795e-06, "1": 0}, "score": 4.5849276459912565}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9010796937070508, "5": 0.0979878781802815, "3": 0.0008611113805985459, "2": 7.068437597050111e-05, "1": 0}, "score": 4.0969854593770885}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt4", "target_model": "human", "scores": {"2": 0.6840933459388692, "3": 0.23641635789754903, "4": 0.07918956055688912, "1": 0.0002331016344848797, "5": 6.574933506745804e-05}, "score": 2.3947603693620985}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9101072220351273, "5": 0.0467499075869092, "3": 0.035844397510736294, "2": 0.007282231055910411, "1": 1.5200343981595214e-05}, "score": 3.996295443074232}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6553363393169619, "5": 0.3399840072425978, "3": 0.004020469870389689, "2": 0.0006563236642974644, "1": 2.3303758369095547e-06}, "score": 4.334644076120152}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8772859368601914, "5": 0.11153439057368793, "3": 0.007954262742431516, "2": 0.003213812666756872, "1": 1.0553563315973746e-05}, "score": 4.097120943162591}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6853202032093109, "5": 0.2683752476520534, "3": 0.024575774442921815, "2": 0.021688044824496162, "1": 3.93311394664094e-05}, "score": 4.200305670315641}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8462948733891605, "1": 0.1470640018826496, "3": 0.006361365012829226, "4": 0.000270899677323949, "5": 6.174936246234311e-06}, "score": 1.8598573109961813}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.6107902918006356, "4": 0.2976754142581834, "3": 0.09078586293908553, "5": 0.0004992635227030584, "1": 0.0002358352712109138}, "score": 2.6874078114163975}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7724840173027476, "3": 0.1078629326532877, "2": 0.07530046265789589, "5": 0.044266858368658714, "1": 8.154186407244284e-05}, "score": 3.7855574769036355}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8430574110812307, "5": 0.14199403916119918, "3": 0.012214945939857398, "2": 0.002725522843764794, "1": 5.179924899313552e-06}, "score": 4.124312868396843}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9896247154734907, "3": 0.00842919166050107, "1": 0.0011587315077538863, "4": 0.0007840369567602913, "5": 1.6365355828148074e-06}, "score": 2.0088434585995887}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9312135509256185, "4": 0.04028034282984686, "3": 0.02600694399210093, "1": 0.0023815191419151085, "5": 0.00011313927229143413}, "score": 2.1045259990949443}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.947379771797733, "3": 0.029058907970129316, "4": 0.02125995123106874, "1": 0.002240782822134218, "5": 5.6096900304575424e-05}, "score": 2.069506630345676}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt4", "target_model": "gpt35", "scores": {"2": 0.9235371063685647, "3": 0.04387461816614072, "4": 0.030629419816245094, "1": 0.001927716764433012, "5": 2.74974028381717e-05}, "score": 2.103288609366301}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.956264409688149, "5": 0.021797260112471597, "2": 0.011308274099639129, "3": 0.010623140407076294, "1": 6.45296398597572e-06}, "score": 3.988538207310459}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9886587414993401, "1": 0.009394263894105229, "3": 0.0015577216593954033, "4": 0.00038774757886074083, "5": 0}, "score": 1.9929389421522978}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9854099455665287, "3": 0.010946914973445528, "4": 0.0034988441775922097, "1": 0.00013997146185875363, "5": 2.059964105148068e-06}, "score": 2.0178108520802995}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9388056093517041, "5": 0.0600158370953477, "3": 0.0007794694983458692, "2": 0.0003981140643085111, "1": 2.4950871312996985e-07}, "score": 4.05843943304678}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9856837659609853, "5": 0.012801798629482046, "3": 0.0009419629644794725, "2": 0.0005713294182706024, "1": 3.062711549761717e-07}, "score": 4.010716266981893}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9576262115353926, "5": 0.04207515731473322, "3": 0.00024630917554485215, "2": 5.162920795399972e-05, "1": 0}, "score": 4.041725618629387}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.5252540650604838, "4": 0.39648256941336374, "3": 0.07807204693244862, "5": 0.00016296126881895078, "1": 2.1712487545649555e-05}, "score": 2.871510148121261}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt4", "target_model": "human", "scores": {"5": 0.9381174261669548, "4": 0.061875548096949416, "3": 4.419407149248866e-06, "2": 2.29275822527225e-06, "1": 0}, "score": 4.9381087154067815}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5389642967839604, "5": 0.4610005928396914, "3": 2.9057585209167495e-05, "2": 5.545737185561575e-06, "1": 0}, "score": 4.460960677512044}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6001531838106667, "5": 0.3997882088388315, "3": 4.422607547301891e-05, "2": 1.3916352088641449e-05, "1": 0}, "score": 4.399716335896476}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6513454254798625, "4": 0.3486400724424583, "3": 1.1947780847139082e-05, "2": 2.044024294357412e-06, "1": 0}, "score": 4.651329722006097}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9724143493655333, "4": 0.02758527398269047, "3": 1.9508158134528683e-07, "2": 4.633593699156977e-08, "1": 0}, "score": 4.97241419311579}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8992751905092803, "2": 0.05572000167553008, "3": 0.035975536974365674, "5": 0.008955016508284246, "1": 6.944913110008986e-05}, "score": 3.861330462454496}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9381084015207237, "2": 0.048947122314365384, "3": 0.012375766909039002, "5": 0.0005270237204996936, "1": 3.586443220365403e-05}, "score": 3.890148779430831}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.938464912914711, "5": 0.0412332751222905, "3": 0.016401458748965175, "2": 0.0038956879164145767, "1": 2.6814979044713976e-06}, "score": 4.017032429835711}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9096290681385256, "5": 0.09006546357535035, "3": 0.00027353171036211443, "2": 3.117269520516501e-05, "1": 0}, "score": 4.089729655017317}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9836713732350144, "5": 0.012976849717179544, "3": 0.0028064405690122096, "2": 0.0005440533206558981, "1": 3.3568654976427104e-07}, "score": 4.009081304051484}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8592281007910185, "5": 0.14026512461521484, "3": 0.0004678578722237141, "2": 3.8404112797663795e-05, "1": 0}, "score": 4.1397205301393605}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.615067322307528, "4": 0.3848992951303643, "3": 2.926410143844032e-05, "2": 3.8990641311383206e-06, "1": 0}, "score": 4.615030395013367}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9415510550549018, "5": 0.0548048437135963, "3": 0.0031900234854578256, "2": 0.0004524415384348423, "1": 7.829272947439636e-07}, "score": 4.050707631637208}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6367156578929238, "5": 0.3627896461046382, "3": 0.00041819739502765906, "2": 7.49786613682545e-05, "1": 0}, "score": 4.3622220419448325}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9866912570074685, "5": 0.010297048275615736, "3": 0.0025631379741049717, "2": 0.0004454065933678058, "1": 0}, "score": 4.006843118671622}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9590302800386822, "5": 0.03082797567876427, "3": 0.008427902092831455, "2": 0.0017122321651021337, "1": 8.758394842128053e-07}, "score": 4.018972995666968}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5155752197855583, "5": 0.4843380963294823, "3": 7.918513231987562e-05, "2": 7.365364635812031e-06, "1": 0}, "score": 4.484244245060264}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7823519623193863, "5": 0.21725130672718895, "3": 0.00034229914850520966, "2": 5.4159562895915285e-05, "1": 1.8349544365097146e-07}, "score": 4.216800157206833}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.584994461100136, "4": 0.41482318905774057, "3": 0.00016269179097348123, "2": 1.9430763508591564e-05, "1": 0}, "score": 4.584793040698376}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7766129939349421, "5": 0.22250335474141517, "3": 0.0006348077886070509, "2": 0.00024859437645507885, "1": 1.5580073280854455e-07}, "score": 4.221370911464412}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9747344305590094, "2": 0.010828319509001226, "5": 0.007442187905859666, "3": 0.006991288534677037, "1": 2.273159145333427e-06}, "score": 3.9787874090498088}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.961654817763902, "5": 0.03502827452679636, "3": 0.0022745462432254447, "2": 0.0010413631530409011, "1": 2.896116353292641e-07}, "score": 4.030670154878566}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7977068140343959, "5": 0.20169187851574238, "3": 0.0005239370575696516, "2": 7.666893125781642e-05, "1": 0}, "score": 4.201014744599667}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7825710045856334, "5": 0.21731212387890522, "3": 9.964257747804063e-05, "2": 1.652235905709696e-05, "1": 0}, "score": 4.217179590042177}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8632486815696713, "5": 0.13658577137118597, "3": 0.00015744600246094271, "2": 7.597601139774325e-06, "1": 0}, "score": 4.136413198844426}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt4", "target_model": "human", "scores": {"2": 0.6264827242789209, "4": 0.20984542305406603, "3": 0.16342777979845688, "1": 0.000156178808308938, "5": 8.230044855936924e-05}, "score": 2.5832126107088333}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9947925385831945, "3": 0.0026248776330659103, "2": 0.0013406563117992364, "5": 0.001239904398898338, "1": 7.414960517961976e-07}, "score": 3.9959314844399625}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9875260646232504, "5": 0.006758682529547266, "3": 0.004868096406129779, "2": 0.0008459483095901113, "1": 0}, "score": 4.000198689744281}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9963603594072408, "5": 0.0020157349714285955, "3": 0.0015455176132243586, "2": 7.57538719522446e-05, "1": 0}, "score": 4.0003187104538265}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9917289390117298, "5": 0.0058970355705976335, "3": 0.0016121598133765043, "2": 0.000761530373512257, "1": 2.289972138637564e-07}, "score": 4.00276112831188}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9428745198960378, "5": 0.04694295208179677, "3": 0.008416409221005458, "2": 0.0017641752116462446, "1": 1.2726019167250321e-06}, "score": 4.034994398112556}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6722696392862119, "4": 0.32763804541526304, "3": 7.208093305743401e-05, "2": 1.9400319945401096e-05, "1": 0}, "score": 4.672159318324733}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5077836540346218, "4": 0.49216079341419333, "3": 5.0353118715148786e-05, "2": 4.9856339057352515e-06, "1": 0}, "score": 4.507723438198637}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.538979813789431, "4": 0.4610138652378145, "3": 5.291932854003588e-06, "2": 7.7438087331825e-07, "1": 0}, "score": 4.538973110349198}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7185765411848505, "4": 0.2813986026560096, "3": 1.9480277781908322e-05, "2": 4.849024535231371e-06, "1": 0}, "score": 4.718547741429779}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9960395277390864, "3": 0.0035365867920381217, "1": 0.0002260864748041786, "4": 0.0001964273333272603, "5": 0}, "score": 2.003703360063642}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.9773759671496525, "4": 0.012893796174467306, "3": 0.009143070582402444, "1": 0.000575435161953971, "5": 1.0539473169697102e-05}, "score": 2.034386887159436}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt4", "target_model": "gpt35", "scores": {"2": 0.8543303442707183, "3": 0.07465055651759583, "4": 0.07012770793892517, "1": 0.0008292927739318337, "5": 5.732280616953412e-05}, "score": 2.2142496712306055}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5895380351802602, "2": 0.3806343636873298, "3": 0.02935136576675689, "5": 0.000387210920185937, "1": 8.6398434632309e-05}, "score": 3.209505846628661}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.8838605832834785, "1": 0.11593727116051397, "3": 0.0001798376605232262, "4": 2.1145551617652064e-05, "5": 0}, "score": 1.8842847231023023}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7033239376927855, "2": 0.21450166036814317, "3": 0.08141564706993648, "5": 0.0006413482223203439, "1": 0.00011320479889821293}, "score": 3.4898806225753596}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8277881374357581, "2": 0.0958234349716198, "3": 0.07580257620788054, "5": 0.00047980873606618573, "1": 9.747905729568292e-05}, "score": 3.7327356366702604}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9159242401392527, "5": 0.0695334950043325, "3": 0.012083112045416847, "2": 0.0024548331092138984, "1": 2.617091424964298e-06}, "score": 4.052532954909365}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6513093875344697, "4": 0.3486207931795288, "3": 6.560261500025278e-05, "2": 3.8185300998953595e-06, "1": 0}, "score": 4.65123640714312}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9312981182679001, "5": 0.06746301211230271, "3": 0.0011250520249443663, "2": 0.00011314945528416816, "1": 0}, "score": 4.066111705348637}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.907333074234207, "5": 0.038039860823494795, "2": 0.03357005935148325, "3": 0.021007606343635292, "1": 4.8159362219595326e-05}, "score": 3.949747595383034}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9758947212098817, "5": 0.02367938359314563, "3": 0.0002756782867050297, "2": 0.00014988368470102582, "1": 0}, "score": 4.023103945635864}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.893888054794291, "2": 0.09131641642882683, "3": 0.011792406165161404, "5": 0.0029815872083648097, "1": 1.887258911488397e-05}, "score": 3.8084992204872017}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9283423152699453, "5": 0.07158608267188568, "3": 5.6714536751121495e-05, "2": 1.4794870871462037e-05, "1": 0}, "score": 4.0714997850178865}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.983945401253809, "5": 0.015903994100697275, "3": 0.00011230299802550993, "2": 3.820917071847302e-05, "1": 0}, "score": 4.015715274214532}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt4", "target_model": "human", "scores": {"4": 0.986216480715366, "2": 0.006242470259616928, "3": 0.005094955736398726, "5": 0.0024445864780285667, "1": 1.2504525902279735e-06}, "score": 3.984860934983605}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9180119050331857, "5": 0.08021499592340144, "3": 0.0013377114476344212, "2": 0.0004342913220880247, "1": 0}, "score": 4.078008787350573}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5619257810488968, "5": 0.43762823830889164, "3": 0.00037488715398007144, "2": 7.043920926868498e-05, "1": 0}, "score": 4.4371127587300565}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.72480091633142, "5": 0.2751033867911449, "3": 8.272547187770037e-05, "2": 1.2886143128790326e-05, "1": 0}, "score": 4.274994912479744}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6370045248882243, "4": 0.3629542448162768, "3": 3.328668802206477e-05, "2": 7.783705872176292e-06, "1": 0}, "score": 4.636955772638708}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt4", "target_model": "human", "scores": {"4": 0.822263101764321, "2": 0.1428878960318648, "3": 0.03289465817154723, "5": 0.0016635190679875867, "1": 0.0002890762684492118}, "score": 3.682125284161173}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9709838647268414, "5": 0.01619268632666689, "3": 0.010133124175771046, "2": 0.0026850106085131724, "1": 4.869248231665971e-06}, "score": 4.000674933489462}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9862650619495112, "5": 0.007648811520577986, "3": 0.0055959900513219835, "2": 0.0004889721612837755, "1": 6.487586949082866e-07}, "score": 4.001072931423764}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9348797010029962, "2": 0.033005287601588565, "3": 0.031005598314847952, "5": 0.0010776608137746178, "1": 3.0570899445652703e-05}, "score": 3.903969661150306}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7133611964166601, "2": 0.18036595656477872, "3": 0.10603167592813578, "5": 0.00018063755371073057, "1": 5.77352299335857e-05}, "score": 3.533242536675642}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8578511923717542, "5": 0.14004036170917705, "3": 0.001966599047415018, "2": 0.00014025126415769312, "1": 0}, "score": 4.137793479997756}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6648551909559285, "5": 0.33431019147674457, "3": 0.0006978118830850345, "2": 0.00013527700403760312, "1": 0}, "score": 4.333342335159414}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9237806890733655, "5": 0.07582853545394344, "3": 0.0003197308531456132, "2": 7.023554753181739e-05, "1": 0}, "score": 4.075368394484193}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7310451327720711, "4": 0.2689364695365629, "3": 1.6175221883334822e-05, "2": 1.5767339036762888e-06, "1": 0}, "score": 4.731026276132056}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9558217282936081, "5": 0.043328961965603756, "3": 0.0007225790732656091, "2": 0.00012556537734651404, "1": 0}, "score": 4.042355301493862}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9687263563120329, "2": 0.014481287213726391, "3": 0.012005408768912698, "5": 0.0047754216752288435, "1": 8.79656723073921e-06}, "score": 3.9637809499186187}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8413805283998663, "2": 0.117483027810141, "3": 0.03583029909809518, "5": 0.0052431312097706816, "1": 6.104123124952968e-05}, "score": 3.7342631286978674}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.945460016485907, "5": 0.048565897107174426, "3": 0.0033569961763262675, "2": 0.002614431250890609, "1": 1.4235824660686276e-06}, "score": 4.039975817067683}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9016957426121088, "5": 0.09805485617786897, "3": 0.00019837467845773435, "2": 5.01569735191501e-05, "1": 0}, "score": 4.097756252557108}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9828862792143185, "5": 0.014465164042044336, "3": 0.0023613731167741, "2": 0.00028646720387567225, "1": 1.9412539901999142e-07}, "score": 4.0115302801635595}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8760695379279291, "3": 0.061509724175130454, "4": 0.05688719540462551, "1": 0.0054592983762543346, "5": 6.872242450417852e-05}, "score": 2.170031922745472}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9491489006434598, "5": 0.05030304836675254, "3": 0.00047057039156584443, "2": 7.68185047168262e-05, "1": 0}, "score": 4.049678873857813}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8907931841579974, "5": 0.10311679511641986, "3": 0.00474806553346268, "2": 0.001339253379204154, "1": 1.5437932820618655e-06}, "score": 4.0956857022506235}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8266959547382207, "4": 0.1732848858248796, "3": 1.6142290349767584e-05, "2": 2.635156460328396e-06, "1": 0}, "score": 4.8266748579165535}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9899808178008056, "2": 0.0057953755408613, "3": 0.0034605767951688977, "5": 0.0007601878379685055, "1": 1.5140914528267933e-06}, "score": 3.98570429584383}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8734053870872664, "5": 0.12582597216793354, "3": 0.00041969575585755784, "2": 0.00034794000238264777, "1": 0}, "score": 4.124710521739709}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6922110806746226, "5": 0.3071667866276734, "3": 0.0004618067705196947, "2": 0.00015959598977297387, "1": 2.1508339506565665e-07}, "score": 4.306385300371125}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9801847271392448, "5": 0.013134481911237124, "3": 0.004756994108611338, "2": 0.001921999362730324, "1": 8.812812697898329e-07}, "score": 4.004530849384507}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6001652170026345, "4": 0.39979622467277715, "3": 2.6825020640437427e-05, "2": 1.1537297612511188e-05, "1": 0}, "score": 4.600115435013196}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6370244761823795, "5": 0.3629656054619327, "3": 7.19897430305057e-06, "2": 2.411354343619308e-06, "1": 0}, "score": 4.362953695578494}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9923394569762004, "3": 0.0038097565100846612, "5": 0.0032081366283504133, "2": 0.0006416676932767247, "1": 0}, "score": 3.9981150428803227}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9940973465160712, "5": 0.004977661881016367, "3": 0.0006133682918942431, "2": 0.000308420946090523, "1": 1.1123396145451752e-06}, "score": 4.0037441225034085}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6653909608670666, "4": 0.33457958682038774, "3": 2.543829098529234e-05, "2": 3.722444432379997e-06, "1": 0}, "score": 4.6653582716904705}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5621694680336518, "5": 0.43781802192344305, "3": 1.0152130226145057e-05, "2": 2.0625303576196627e-06, "1": 0}, "score": 4.437803874052027}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.890162418686123, "5": 0.1096895254337017, "3": 0.00012644210785036497, "2": 2.0966156824880527e-05, "1": 0}, "score": 4.109521221939842}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9608640300533464, "2": 0.023314670065284506, "3": 0.010185430114536459, "5": 0.0056249287367169725, "1": 1.0042615195295727e-05}, "score": 3.9487799846291987}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8624726333752595, "5": 0.13646299500166095, "3": 0.0009636070219942056, "2": 9.998883782063587e-05, "1": 2.328312254835002e-07}, "score": 4.135298785268394}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9663023133026225, "5": 0.03010606597869069, "3": 0.0033254396102657827, "2": 0.00026457018292272286, "1": 5.609388158653981e-07}, "score": 4.026249830748105}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7930267383071701, "5": 0.2068733931772515, "3": 9.19378272615482e-05, "2": 7.546716424248429e-06, "1": 0}, "score": 4.206766441309643}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9646818993162043, "5": 0.03405743550619268, "3": 0.0007179705546455211, "2": 0.000541952607708452, "1": 4.715658895960019e-07}, "score": 4.032254153761577}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9363353226186873, "5": 0.039255779389536546, "2": 0.01314903903782629, "3": 0.011246969099587605, "1": 1.1621461963961094e-05}, "score": 4.001675869954065}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8641214611705715, "2": 0.11334807329631676, "3": 0.022319558993945506, "5": 0.00011896669237968099, "1": 8.980077072582706e-05}, "score": 3.750833325807155}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8108794983001181, "5": 0.18667504518662534, "3": 0.0020416219775621536, "2": 0.0004020192037354631, "1": 1.0281381631611074e-06}, "score": 4.183826445094139}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7057546098671614, "5": 0.294202315602827, "3": 4.0503871331012545e-05, "2": 2.5491820881251185e-06, "1": 0}, "score": 4.2941567196848025}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9655275529762891, "5": 0.03408728970839921, "3": 0.0003502177689377828, "2": 3.467623416635811e-05, "1": 0}, "score": 4.033667728336253}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7486000475449414, "5": 0.2430348573607402, "3": 0.004181646125667349, "2": 0.004181646125667349, "1": 1.092490069194644e-06}, "score": 4.2304868052405045}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6513151842138138, "4": 0.34862389591839527, "3": 4.3023610997584997e-05, "2": 1.7656854377028772e-05, "1": 0}, "score": 4.651237002801774}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8438903414663645, "4": 0.15610401985478153, "3": 4.795378098876722e-06, "2": 8.333117625777066e-07, "1": 0}, "score": 4.84388388789429}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7431630352530936, "4": 0.25683028034541355, "3": 4.9371861219286826e-06, "2": 1.653750200959158e-06, "1": 0}, "score": 4.7431548600256646}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.912069176827379, "3": 0.05651273319148049, "4": 0.031209295370404146, "1": 0.0002006569147692282, "5": 0}, "score": 2.1187316332194523}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8668109731679743, "5": 0.13292977469748346, "3": 0.00016829199866417882, "2": 9.008021561330436e-05, "1": 3.6813725233913717e-07}, "score": 4.132580285708173}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.851937339538503, "5": 0.1480445110642865, "3": 1.2754619987916715e-05, "2": 5.073437308300906e-06, "1": 0}, "score": 4.148021657134949}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8590669848527853, "5": 0.1402388273697933, "3": 0.0004605180990504988, "2": 0.00023156313505497575, "1": 6.923612361324864e-07}, "score": 4.139313302931302}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7548292305641279, "5": 0.24505718193913584, "3": 8.481713261657814e-05, "2": 2.796972172087321e-05, "1": 0}, "score": 4.244916621453709}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6925562616228876, "5": 0.30731997817496504, "3": 7.197145326490747e-05, "2": 5.024417189201537e-05, "1": 6.62834169144671e-07}, "score": 4.307145800699014}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8869625132207222, "2": 0.07996208453239212, "3": 0.025959888038558036, "5": 0.00698700907899631, "1": 0.00012598760863696134}, "score": 3.8207245378200576}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.915933446140055, "3": 0.05675216349995935, "2": 0.025983033802998694, "5": 0.0013139906166540136, "1": 1.6284269133160567e-05}, "score": 3.8925467904742557}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9453819058061416, "3": 0.0264026366687668, "5": 0.021215114568264668, "2": 0.006996005049894988, "1": 3.361773149905202e-06}, "score": 3.9808103637486068}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9784633442624673, "3": 0.01193807985636262, "5": 0.00600284353211792, "2": 0.003584461591110225, "1": 1.0226563072421534e-05}, "score": 3.986865147088971}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9692792935340009, "5": 0.020755321652630335, "3": 0.007517081610909427, "2": 0.002440439092315824, "1": 6.962638922135373e-06}, "score": 4.008336481455421}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.743027100872672, "5": 0.24888289359345, "3": 0.006950803601322839, "2": 0.0011346874958647665, "1": 3.7847792314570136e-06}, "score": 4.239651535526233}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9815546094953547, "3": 0.009473635016259628, "5": 0.004763642844346589, "2": 0.004203900055155137, "1": 2.985500958224335e-06}, "score": 3.986873235107207}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9348817857870539, "3": 0.041075842664684045, "2": 0.023041459472501753, "5": 0.000996675816355491, "1": 2.0481266743292154e-06}, "score": 3.9138315812787074}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5774682768248629, "4": 0.42248481654595554, "3": 4.1245151148831355e-05, "2": 5.243732521199263e-06, "1": 0}, "score": 4.577416785421942}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9417665772155039, "5": 0.028438887279667698, "3": 0.018650677620751514, "2": 0.011136826047779682, "1": 5.696702837794324e-06}, "score": 3.987497450762272}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt4", "target_model": "human", "scores": {"4": 0.982502013379106, "5": 0.009632109713108588, "3": 0.00420795709354338, "2": 0.003655936478978521, "1": 1.5995671445114338e-06}, "score": 3.9981074802338856}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9315542790994475, "5": 0.06748155349550053, "3": 0.0008902341855671017, "2": 7.307487189722327e-05, "1": 0}, "score": 4.066445226599238}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9128368691329779, "5": 0.08490706275670051, "3": 0.0020602086807012332, "2": 0.0001946469798160858, "1": 0}, "score": 4.082457660092142}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9399763468125993, "5": 0.05824187973179157, "3": 0.0016265800453703183, "2": 0.0001536781619219628, "1": 3.0134049467209493e-07}, "score": 4.056307107692732}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6991586188214474, "5": 0.30070438694058793, "3": 0.00012359468691366637, "2": 1.3026784160666837e-05, "1": 0}, "score": 4.30055485072225}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8627852242167666, "2": 0.06972374115916095, "3": 0.056024599943438905, "5": 0.011382084441108537, "1": 8.163805862573059e-05}, "score": 3.815664588052487}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8181179905951687, "3": 0.09470403229726744, "2": 0.07974879078521284, "5": 0.006968369588563022, "1": 0.00043856654573656996}, "score": 3.751445525699866}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6785323785938866, "5": 0.32051599418923526, "3": 0.0007700362240517787, "2": 0.00018006403866215897, "1": 8.338619298762467e-07}, "score": 4.3193835496643285}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9408047302016697, "2": 0.03373752026403108, "3": 0.02111240070494151, "5": 0.004092824338233967, "1": 0.00024198253592761927}, "score": 3.9147785370966037}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9856760204883843, "3": 0.013208064354344592, "4": 0.0008988200593304442, "1": 0.00021348862615358144, "5": 0}, "score": 2.014792269194753}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8389721058237352, "2": 0.10834302801014767, "3": 0.05117762265467665, "5": 0.001474660330672033, "1": 2.7434670437761706e-05}, "score": 3.7335273057069673}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8264949267280252, "5": 0.1732427480648063, "3": 0.0001876023490278737, "2": 7.346613545710005e-05, "1": 0}, "score": 4.172908430742811}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.847765707237495, "5": 0.15199601128898665, "3": 0.0001752098779601939, "2": 6.24730059074972e-05, "1": 0}, "score": 4.151695946202835}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7122291638613099, "4": 0.28776658390750887, "3": 2.654232559120508e-06, "2": 1.4207083112164586e-06, "1": 0}, "score": 4.712223794482507}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5926567405174018, "5": 0.4073266237608134, "3": 1.3742532119167893e-05, "2": 2.7486793445022157e-06, "1": 0}, "score": 4.407307442730135}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7737298788799787, "2": 0.1263079381571773, "3": 0.09836872114494427, "5": 0.0014476949168508743, "1": 0.00014334116498603537}, "score": 3.6500322250331405}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8592552957907671, "5": 0.14026957109014138, "3": 0.00045347790983154694, "2": 2.1209422870764805e-05, "1": 0}, "score": 4.139773736643797}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9102746197978758, "5": 0.06697847365143653, "3": 0.019189653987510418, "2": 0.003549729058346461, "1": 4.783878207205823e-06}, "score": 4.040675121347257}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7426641168015923, "5": 0.25665787670316276, "3": 0.0006070577690600067, "2": 7.027207951402611e-05, "1": 2.1010971295746427e-07}, "score": 4.255909763837299}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5663322436967672, "3": 0.24357645552834747, "2": 0.18969753430323424, "5": 0.00024016148661400315, "1": 0.00014566530491355812}, "score": 3.3768266936403433}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt4", "target_model": "human", "scores": {"5": 0.7879272860250215, "4": 0.21206776694247303, "3": 4.339614667864609e-06, "2": 6.251807681429134e-07, "1": 0}, "score": 4.787921682053019}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9481540736363525, "4": 0.05184544488239668, "3": 2.1219970520486203e-07, "2": 7.929323665706735e-08, "1": 0}, "score": 4.948153882988326}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7121887317593535, "4": 0.28775026800476156, "3": 5.586692692685474e-05, "2": 4.958471648965916e-06, "1": 0}, "score": 4.71212307239481}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7122279744395994, "4": 0.287766094704732, "3": 5.036838270574716e-06, "2": 7.033002065117246e-07, "1": 0}, "score": 4.712221666833832}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6224481420855931, "4": 0.3775338671547227, "3": 1.2154087803865155e-05, "2": 5.309727724573197e-06, "1": 0}, "score": 4.622425696525923}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9782478027469402, "5": 0.012314325740308565, "3": 0.004975437363372285, "2": 0.004459953228002984, "1": 1.9210896631881197e-06}, "score": 3.99841321776361}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9857676384037563, "5": 0.013209292761449587, "3": 0.0005537984755166394, "2": 0.00046634507200830774, "1": 0}, "score": 4.011722838434587}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9537629724077059, "5": 0.04602409570337827, "3": 0.00013977661735308972, "2": 7.251515380100178e-05, "1": 0}, "score": 4.045739318056973}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6297693107922647, "4": 0.37022227887793413, "3": 7.342905125343238e-06, "2": 8.110784946743468e-07, "1": 0}, "score": 4.629760507166851}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8669088069750639, "5": 0.13294475672731337, "3": 0.00011038117002900434, "2": 3.583551919981778e-05, "1": 0}, "score": 4.132762733674695}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt4", "target_model": "human", "scores": {"5": 0.8351786875161914, "4": 0.16445643116452469, "3": 0.00030770777741157153, "2": 5.603774928240463e-05, "1": 0}, "score": 4.83475985235427}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9449922269235014, "4": 0.05500514239661887, "3": 2.135992816358553e-06, "2": 3.0771894093903166e-07, "1": 0}, "score": 4.944989652175744}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9018886585078779, "4": 0.09807586177768171, "3": 2.858469852269361e-05, "2": 6.181874594792366e-06, "1": 0}, "score": 4.9018483532054935}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9802801429643974, "4": 0.019719115179657992, "3": 5.021876411220292e-07, "2": 1.7355140483021765e-07, "1": 0}, "score": 4.980279358486977}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.8267008322587422, "4": 0.173285908208722, "3": 1.0586435988396393e-05, "2": 1.9582937491626312e-06, "1": 0}, "score": 4.82668692015338}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9756168659677328, "5": 0.011537122489405924, "2": 0.009270338355653392, "3": 0.003574033818223273, "1": 1.0747365459015918e-06}, "score": 3.9894191817759648}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9336162335870752, "5": 0.0635333826625477, "2": 0.0016668577696488445, "3": 0.0011819791497018086, "1": 7.524441969125394e-07}, "score": 4.059015477522076}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9838264297690503, "5": 0.014478999351092533, "3": 0.0014561912278829561, "2": 0.00023771668322671206, "1": 0}, "score": 4.012547383075279}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5774801843434971, "5": 0.4224935282726903, "3": 2.207740214398214e-05, "2": 3.836477231701088e-06, "1": 0}, "score": 4.422463935708237}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9912044164671721, "5": 0.004312082124440946, "3": 0.0026565967304337263, "2": 0.0018258504508982506, "1": 5.66473803650696e-07}, "score": 3.99800208409631}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt4", "target_model": "human", "scores": {"5": 0.5544208630779602, "4": 0.44548967880731294, "3": 7.398072290353823e-05, "2": 1.4567668079752999e-05, "1": 0}, "score": 4.554318251295372}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9089388398150449, "5": 0.08999712082472305, "3": 0.0007429717020810522, "2": 0.00031954833894123105, "1": 6.464777858235089e-07}, "score": 4.088613190356666}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8221844396162391, "4": 0.17780986033283908, "3": 4.123059801413188e-06, "2": 1.2574621937962643e-06, "1": 0}, "score": 4.822178064341723}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7371564940888676, "4": 0.26284126083401127, "3": 1.5171067362307904e-06, "2": 4.699777423809238e-07, "1": 0}, "score": 4.7371542272070135}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.76064872824979, "4": 0.23934872262683377, "3": 1.7463930697932763e-06, "2": 6.035372952850712e-07, "1": 0}, "score": 4.7606459262974825}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9835867299879174, "5": 0.009346067615787261, "3": 0.004346325080562166, "2": 0.00271986073595919, "1": 3.46312600541059e-07}, "score": 3.999558981829904}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.4999776407799223, "5": 0.4999776407799223, "3": 3.861221039650811e-05, "2": 5.829571846541422e-06, "1": 0}, "score": 4.499927507734734}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9043727721621031, "5": 0.09532018365813903, "3": 0.00027195117811587, "2": 3.457471235149169e-05, "1": 0}, "score": 4.0949791322819875}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9744695688227956, "5": 0.025169760126887764, "3": 0.00029764412396030655, "2": 6.238959770069317e-05, "1": 0}, "score": 4.024747352579723}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9578280534855492, "5": 0.04208402769280017, "3": 4.5572230828616255e-05, "2": 4.2147423597460685e-05, "1": 0}, "score": 4.041954168970673}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7822515147762947, "3": 0.12769904428957954, "2": 0.08776618405208154, "5": 0.0022317840297709835, "1": 5.0082996434754585e-05}, "score": 3.698849704091227}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8533892627835246, "2": 0.11549367643495564, "3": 0.030602777688791875, "5": 0.00048697912513478514, "1": 2.5808930048851095e-05}, "score": 3.738819031300931}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8328376947813096, "2": 0.10588344132779237, "3": 0.060330566291980484, "5": 0.0009304970985956949, "1": 1.6518295056661453e-05}, "score": 3.728783145510181}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9211485017863174, "5": 0.07801267230811343, "3": 0.000707332857622441, "2": 0.0001308434483721201, "1": 0}, "score": 4.077043702601303}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9921758502601922, "4": 0.00399193181934966, "3": 0.003634695283440516, "1": 0.0001956654979148628, "5": 0}, "score": 2.011422914638166}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt4", "target_model": "human", "scores": {"5": 0.718508171879678, "4": 0.2813718429213425, "3": 7.948414421754616e-05, "2": 3.9347504624144284e-05, "1": 0}, "score": 4.7183508213799}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6369418467267914, "4": 0.36291849558384104, "2": 7.269764989596866e-05, "3": 6.619196347825763e-05, "1": 0}, "score": 4.636730748521124}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8840178060118592, "4": 0.11595789823577739, "3": 1.6993952712271197e-05, "2": 6.866177577165278e-06, "1": 0}, "score": 4.883987464788445}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9875678092198148, "4": 0.012431641781517299, "3": 2.1759397734284998e-07, "2": 1.0119059694228875e-07, "1": 0}, "score": 4.987567616596627}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6368571900429324, "5": 0.3628703032076721, "3": 0.00017990439267332863, "2": 9.046160965183363e-05, "1": 0}, "score": 4.362510251638454}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8051101408427754, "4": 0.13990717667783772, "3": 0.054788437599506266, "1": 0.0001337014805827955, "5": 5.9329672362473234e-05}, "score": 2.334647484662353}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9512985480982481, "3": 0.024571275030555086, "2": 0.020691088058287475, "5": 0.0034309194242742426, "1": 7.050387345678195e-06}, "score": 3.937456247128567}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9240729539184455, "3": 0.035830198773398145, "5": 0.033659356770933596, "2": 0.0064240019422175275, "1": 1.2996389108110794e-05}, "score": 3.9849421575342174}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8669690072127483, "5": 0.13295398341359257, "3": 7.016738191492679e-05, "2": 6.629361918178895e-06, "1": 0}, "score": 4.132870585560091}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9133193852580654, "2": 0.051525955911261384, "3": 0.03275189028305381, "5": 0.002029340125707757, "1": 0.0003526464362464589}, "score": 3.8651647965681266}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5643994406818402, "4": 0.40021913275170257, "3": 0.03442858845511531, "5": 0.000889262580429418, "1": 5.774389086762953e-05}, "score": 2.837481781701235}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8594278343896263, "5": 0.140297740048085, "3": 0.000217624817168074, "2": 5.589067541699534e-05, "1": 0}, "score": 4.139968461261138}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6612769569410735, "2": 0.2080800120357098, "3": 0.13021314425027808, "5": 0.00037150163230268606, "1": 5.1873214462800576e-05}, "score": 3.453839157108129}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.54670638171073, "4": 0.4532355095332439, "3": 4.5651732492523106e-05, "2": 1.2096504879760153e-05, "1": 0}, "score": 4.546636734041218}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5926488582351702, "4": 0.40732120635274327, "3": 1.937982464089541e-05, "2": 9.593708873378104e-06, "1": 0}, "score": 4.592610861012472}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8967177378197776, "3": 0.04678750962660348, "5": 0.04327137275150599, "2": 0.013197023067682586, "1": 2.4309593288259257e-05}, "score": 3.9700168268298857}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9851332596263627, "5": 0.011116181938193387, "3": 0.002559090390094038, "2": 0.0011900875537325572, "1": 1.102309537115661e-06}, "score": 4.00617361122941}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9313102159090304, "5": 0.06746387564438434, "3": 0.0011250669882358038, "2": 9.985534192841983e-05, "1": 2.93933290034218e-07}, "score": 4.066138261952211}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9589334765720406, "5": 0.040836315813588535, "3": 0.00021428921144195514, "2": 1.552305841191657e-05, "1": 0}, "score": 4.0405909965327504}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.973195354025109, "3": 0.014548088042687783, "2": 0.010981472987843483, "5": 0.0012711977661752979, "1": 3.1021349188712002e-06}, "score": 3.96475082967092}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9304113535336279, "5": 0.04217707297539421, "2": 0.018425798573511953, "3": 0.008980018828098636, "1": 4.18238876406654e-06}, "score": 3.9963329040630686}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6512657252167066, "5": 0.3485974363688477, "3": 0.00012644375160845132, "2": 1.0059802758457997e-05, "1": 0}, "score": 4.348450989694048}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6581856596058826, "5": 0.3414622321787959, "3": 0.0003065459179324513, "2": 4.485757892054223e-05, "1": 0}, "score": 4.341066211458681}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5467238547259068, "5": 0.45324999517160786, "3": 2.224961172647037e-05, "2": 3.5758380132041255e-06, "1": 0}, "score": 4.453220741023213}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7771901152282238, "5": 0.2226686916318361, "3": 0.0001103950789326705, "2": 3.0180335139430363e-05, "1": 0}, "score": 4.22249807332544}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9722319891833473, "2": 0.017807047020566708, "3": 0.007658715489171328, "5": 0.002299563400352389, "1": 1.5828461035757776e-06}, "score": 3.9590219601714596}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8630221344204354, "5": 0.13654993596658888, "3": 0.00033322587320865657, "2": 9.399067337798278e-05, "1": 0}, "score": 4.136028825744208}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8975680273516706, "5": 0.1007043482451187, "3": 0.001577653598475724, "2": 0.00014905547587566615, "1": 2.8774475993156923e-07}, "score": 4.098827782483358}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9622870442764302, "5": 0.03731192120662054, "3": 0.0003228111760357706, "2": 7.78818206578874e-05, "1": 0}, "score": 4.036833358968607}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9608247488130232, "4": 0.02259643338457011, "3": 0.016531903822603156, "1": 4.5006033473167356e-05, "5": 0}, "score": 2.0616798822401754}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7308659609493218, "5": 0.26887056128526565, "3": 0.00018507026392381752, "2": 7.714876400171717e-05, "1": 0}, "score": 4.268531531504044}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8078887545113674, "5": 0.19189040062845347, "2": 0.00014966950420745425, "3": 7.069886775293196e-05, "1": 1.836551541509414e-07}, "score": 4.191519867870173}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9785712101358928, "5": 0.008599623979435676, "2": 0.006909991992714316, "3": 0.005910429362699895, "1": 4.907298358873033e-06}, "score": 3.9888544459681663}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6076541324383381, "4": 0.39233100303325213, "3": 1.2052059497209686e-05, "2": 2.2294068375599696e-06, "1": 0}, "score": 4.607637975855825}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8870741231874812, "5": 0.11277881137308148, "3": 0.00011472747782098294, "2": 3.087848175442598e-05, "1": 4.4739408894120585e-07}, "score": 4.112601098711456}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5317106917819769, "2": 0.41409670312724206, "3": 0.04433278978466197, "5": 0.009738621510888798, "1": 0.00011697726012060713}, "score": 3.136857854222219}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9267285014577261, "2": 0.06306466818077952, "3": 0.008944471920870424, "5": 0.0012489281194189928, "1": 1.1148339443313004e-05}, "score": 3.866141369355706}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6063478182834606, "5": 0.3914875753774836, "3": 0.0012076832791263457, "2": 0.0009553561070741317, "1": 4.811070665646441e-07}, "score": 4.388368158270939}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5467279770393125, "4": 0.45325341268945546, "3": 1.2287488603238313e-05, "2": 6.082747941674521e-06, "1": 0}, "score": 4.546703655282667}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5234049455703453, "5": 0.47656562613935227, "3": 1.8219374447672345e-05, "2": 1.0879285387386256e-05, "1": 0}, "score": 4.476525805271554}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.895553720400827, "5": 0.10366785422396367, "3": 0.00045809315469563447, "2": 0.00031980056206959564, "1": 2.573540689538089e-07}, "score": 4.102569416018163}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6653662553593502, "4": 0.3345671406912574, "3": 5.4698897726043944e-05, "2": 1.1465511827992101e-05, "1": 0}, "score": 4.665288917858952}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9603139295773094, "5": 0.03723541330407393, "3": 0.0019428098062935358, "2": 0.0005068122188506574, "1": 0}, "score": 4.034279014542063}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5233747459762527, "5": 0.47653812909602133, "3": 7.670205939128141e-05, "2": 1.0061120678941277e-05, "1": 0}, "score": 4.47644147714686}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8434026463147577, "5": 0.1560138178022099, "3": 0.00044511138666823735, "2": 0.00013788907505223622, "1": 1.6657652891528933e-07}, "score": 4.155292485814675}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9561642481497149, "5": 0.043344493848719426, "3": 0.00035228304513099795, "2": 0.00013795596747373745, "1": 2.3872561474396073e-07}, "score": 4.042715616021226}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9929434551623957, "5": 0.003995020773110785, "3": 0.001947017625476547, "2": 0.0011093772024449212, "1": 1.426613648493676e-06}, "score": 3.9998249682537215}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9942953049226164, "3": 0.0028367507043457517, "5": 0.0017205762761471062, "2": 0.0011461508930833946, "1": 4.0928831606305754e-07}, "score": 3.9965902931659314}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9668346750515452, "5": 0.03308326875747385, "3": 5.636128902056916e-05, "2": 2.5404023270672813e-05, "1": 0}, "score": 4.032976109013959}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9939490409397047, "5": 0.0034744502983622564, "3": 0.0024255572188966235, "2": 0.00015028996949387904, "1": 0}, "score": 4.000748313635543}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt4", "target_model": "human", "scores": {"5": 0.8434626902863886, "4": 0.15602491077900632, "3": 0.0004451432577844952, "2": 6.616466492403666e-05, "1": 5.051734506543187e-07}, "score": 4.8428841959723705}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8633839114340789, "4": 0.1366071623778548, "3": 7.250827193144215e-06, "2": 1.5437901944783885e-06, "1": 0}, "score": 4.863373686621158}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5073133596218438, "4": 0.4917049684393404, "3": 0.0006944596477845072, "2": 0.00028500580770242644, "1": 1.1289178939732374e-06}, "score": 4.506046046902702}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6859411926025669, "4": 0.3140467559059284, "3": 8.513656812330386e-06, "2": 3.0356378220408155e-06, "1": 0}, "score": 4.68592695214048}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6722647317357576, "5": 0.3276356536662614, "3": 6.562997699528738e-05, "2": 3.352051226829947e-05, "1": 0}, "score": 4.327503134661789}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9592626678001254, "5": 0.025563480217434358, "2": 0.010656449321674605, "3": 0.004512224544303296, "1": 3.306183681719848e-06}, "score": 3.9997284379703903}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.8633759079023163, "3": 0.08819939283059022, "4": 0.039754580969746954, "1": 0.008597532805180974, "5": 4.3049712732205944e-05}, "score": 2.15924487452459}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9735357730536381, "5": 0.018396944278119203, "3": 0.006457934817449169, "2": 0.001607507075993467, "1": 1.1595877545714335e-06}, "score": 4.008720522485726}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9824760127898653, "5": 0.010914326445002303, "3": 0.0038916229405164715, "2": 0.0027167906592426546, "1": 8.042915573364785e-07}, "score": 4.001586710014041}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7864680345241113, "2": 0.1324628434069838, "3": 0.08034277579904914, "1": 0.0005246897617713007, "5": 0.00018418350270796126}, "score": 3.6533355943353527}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8997248451618324, "5": 0.08368743769725248, "3": 0.015724409952391747, "2": 0.0008598169845727746, "1": 1.8808420170157367e-06}, "score": 4.066237857850351}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7427275133163271, "5": 0.256679770553805, "3": 0.000570326816023393, "2": 2.1433595151432605e-05, "1": 0}, "score": 4.2560668212753265}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8353396252499453, "4": 0.16448812497241042, "3": 0.00016733010833914745, "2": 4.3900629130016815e-06, "1": 0}, "score": 4.835163957323951}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9144913453512409, "5": 0.08244390139712451, "3": 0.002412992983824793, "2": 0.0006494482511055817, "1": 9.917825076699255e-07}, "score": 4.0787291405044686}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.47694695487042027, "2": 0.4622728397427004, "3": 0.060637000677153385, "5": 7.557764647868925e-05, "1": 5.794739162364921e-05}, "score": 3.014709518020734}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9332380649169999, "5": 0.06552359317845645, "3": 0.0009643126405591931, "2": 0.00027199686975178306, "1": 1.0773890393423082e-06}, "score": 4.0640121157631794}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6001484726266652, "5": 0.39978507051371004, "3": 5.503985493341993e-05, "2": 1.0669962576647653e-05, "1": 0}, "score": 4.399708989333073}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6512615310789412, "5": 0.3485951704928754, "3": 0.00012255275103207068, "2": 1.9696019469942415e-05, "1": 0}, "score": 4.348433591438899}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7548910309629989, "4": 0.2450772529442331, "3": 2.7111379783751196e-05, "2": 4.093206130528628e-06, "1": 0}, "score": 4.754856119285034}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8437886419309482, "5": 0.1560852104536782, "3": 0.00010912920617372739, "2": 1.5721552756224074e-05, "1": 0}, "score": 4.155944840380063}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7653948304986131, "5": 0.22625029331116558, "3": 0.00469567456183612, "2": 0.003656995025806446, "1": 1.4120203596240124e-06}, "score": 4.214236562865201}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6925130820861115, "4": 0.30730080200662957, "3": 0.00011146465643048102, "2": 7.425146870042437e-05, "1": 1.0324324819788809e-07}, "score": 4.692253010042468}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5533765427728213, "4": 0.444650543867972, "3": 0.0012489313666363248, "2": 0.0007228260207235142, "1": 7.468944203666759e-07}, "score": 4.550679943952211}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8990021616575534, "4": 0.10086524105713024, "3": 7.390574447100373e-05, "2": 5.846425594242822e-05, "1": 1.0116934914802709e-07}, "score": 4.898811137247215}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7490279198435826, "4": 0.25089293114506966, "3": 4.648043902522375e-05, "2": 3.244857595696743e-05, "1": 4.8028127888069095e-08}, "score": 4.748916526958116}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9873699609421307, "3": 0.007900449676919946, "5": 0.002730322349543279, "2": 0.001997546502988179, "1": 4.326503244416153e-07}, "score": 3.9908334699103003}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9923193929683246, "3": 0.006183718434648556, "2": 0.0009336018457214884, "5": 0.0005574791245970712, "1": 2.1739603667439413e-06}, "score": 3.9925000078649364}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9644892368538178, "5": 0.016337671545170088, "3": 0.015347822065488804, "2": 0.0038203749757119796, "1": 4.009748647627533e-06}, "score": 3.9933370643868744}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.877351340964692, "5": 0.12250570238489517, "3": 0.0001368708195445778, "2": 5.390631599706261e-06, "1": 0}, "score": 4.122358135365438}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9920362202649138, "5": 0.004182920467377941, "3": 0.003414000186438163, "2": 0.00036549951709237714, "1": 4.774191551243769e-07}, "score": 4.000036489021478}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9075184014217024, "5": 0.08985649331248755, "2": 0.0014752665406355529, "3": 0.001148938737086011, "1": 4.1028409605378053e-07}, "score": 4.085755832636817}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5544618584721572, "4": 0.44552261953196753, "3": 1.3059339626251142e-05, "2": 2.1318785895976533e-06, "1": 0}, "score": 4.554444718773279}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5621692600309871, "5": 0.43781785993080496, "3": 9.100301619415849e-06, "2": 3.5084788166323463e-06, "1": 0}, "score": 4.437801861428711}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8221858948839852, "4": 0.17781018039087573, "3": 3.0640040018498995e-06, "2": 8.118802362221915e-07, "1": 0}, "score": 4.822181247275584}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6926340400582454, "5": 0.30735449214643734, "3": 1.0867292151089703e-05, "2": 4.556102991245212e-07, "1": 0}, "score": 4.307342758165461}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9497184440494466, "5": 0.03799351848454513, "3": 0.00808928849889541, "2": 0.004196667588229548, "1": 1.322528663136069e-06}, "score": 4.02150694354375}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7185651087230256, "4": 0.28139415659321154, "3": 3.754861742522113e-05, "2": 2.941034993380279e-06, "1": 0}, "score": 4.7185218540959895}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7545290192122063, "5": 0.24495971757910692, "3": 0.0004583344042449524, "2": 5.2233474220947646e-05, "1": 0}, "score": 4.2443970861631}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8354732234450423, "4": 0.1645144287265226, "3": 1.1038382947391339e-05, "2": 1.1634370030719536e-06, "1": 0}, "score": 4.835459980172334}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9885949009223827, "5": 0.009104640958711658, "3": 0.002096007362261853, "2": 0.0002043153345450132, "1": 0}, "score": 4.006600003821146}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8666316918609829, "5": 0.13290226108187853, "3": 0.00032943186777013254, "2": 0.0001351985661244551, "1": 0}, "score": 4.132302619504825}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.569815326070175, "4": 0.43011917393804733, "3": 4.332338497646215e-05, "2": 2.1784366030757018e-05, "1": 0}, "score": 4.569728657423944}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8670084378598425, "4": 0.1329600462534679, "3": 2.2080139911586066e-05, "2": 9.204371718327809e-06, "1": 0}, "score": 4.866968149571302}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8807946831317333, "4": 0.11920260149101364, "3": 1.411749277739658e-06, "2": 1.2458643648312878e-06, "1": 0}, "score": 4.880790830531384}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5466923862065015, "4": 0.4532239068527148, "3": 6.047720746657605e-05, "2": 2.2954558815178952e-05, "1": 0}, "score": 4.546586150287976}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8498168952979014, "5": 0.14767602867644944, "3": 0.0020100222245142837, "2": 0.0004925771302349619, "1": 2.584808846328027e-06}, "score": 4.144673371466987}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6150525670194563, "5": 0.3848900769026346, "3": 4.9006971228679943e-05, "2": 7.876137021439812e-06, "1": 0}, "score": 4.384825499668148}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8883500039977722, "5": 0.09967011462084223, "2": 0.006079914777261976, "3": 0.0058928554649061455, "1": 3.6932120658811537e-06}, "score": 4.081606628890727}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6441676246647471, "5": 0.35574314903679943, "3": 7.94966242078419e-05, "2": 9.05973217141785e-06, "1": 0}, "score": 4.355645771210315}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9556933452069196, "5": 0.030720714884303793, "3": 0.009224032247302226, "2": 0.0043571243150301074, "1": 2.9991129390605385e-06}, "score": 4.012773459458959}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9813380484565132, "3": 0.008759745736226556, "2": 0.007975839255888855, "5": 0.0019242607711154396, "1": 1.4099405747919062e-06}, "score": 3.977208590842221}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6149756964032338, "5": 0.3848419455593328, "3": 0.00015817666763695326, "2": 2.3510862724971984e-05, "1": 0}, "score": 4.384637005068079}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.817255903326842, "5": 0.18235444241511234, "3": 0.000335906402767153, "2": 5.314811071990041e-05, "1": 0}, "score": 4.1819123488918475}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6513490144030444, "5": 0.34864202483233075, "3": 6.914879630588469e-06, "2": 1.7212496332077675e-06, "1": 0}, "score": 4.348631780631639}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8705751446063602, "5": 0.12939943024209893, "3": 2.1827258049210258e-05, "2": 3.4000310297049337e-06, "1": 0}, "score": 4.129370828519621}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7640537185875809, "5": 0.2330232371806792, "3": 0.002629418920446308, "2": 0.0002904389960820003, "1": 1.1150436565078317e-06}, "score": 4.229810071136162}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7667948071027882, "3": 0.12132456125208657, "2": 0.11046727010991143, "5": 0.0013477941309531965, "1": 6.205986960860405e-05}, "score": 3.6589013166347666}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8765518680897952, "5": 0.11144106420254109, "3": 0.009890954760889331, "2": 0.0021059057907665928, "1": 6.198922942225549e-06}, "score": 4.097320091172899}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8518228894452932, "5": 0.1480246152190302, "3": 0.0001414588069818113, "2": 1.0247241608117485e-05, "1": 0}, "score": 4.147862778635014}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.960363843190918, "5": 0.03841938995831838, "3": 0.001072977269093701, "2": 0.00014296038415020514, "1": 2.8922294796500324e-07}, "score": 4.037059644263347}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt4", "target_model": "human", "scores": {"2": 0.6736605701770627, "3": 0.17573487706289365, "4": 0.15031400594069041, "1": 0.00022248430459326265, "5": 6.576623481809541e-05}, "score": 2.476338797151361}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6297446872936053, "4": 0.37020780346982607, "3": 3.847255223062481e-05, "2": 8.719571161323548e-06, "1": 0}, "score": 4.629688975281723}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7646910140110655, "5": 0.23321758965808978, "3": 0.001547045339198583, "2": 0.0005430639898206173, "1": 8.293206212066152e-07}, "score": 4.23058203391045}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5467142543393095, "4": 0.4532420361715729, "3": 3.6682747822847286e-05, "2": 6.474889604643012e-06, "1": 0}, "score": 4.54666492349024}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9649763120913798, "3": 0.01355124708632942, "2": 0.0112343784222244, "5": 0.010229017957099594, "1": 6.718457288151778e-06}, "score": 3.974188798617972}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt4", "target_model": "human", "scores": {"2": 0.41890917444157455, "4": 0.3696860489089595, "3": 0.21064075067892332, "5": 0.0004680310116652585, "1": 0.0002928863230991786}, "score": 2.9511270119161983}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6369003322101946, "4": 0.3628948703587879, "3": 0.00016381595269289705, "2": 4.014482570394091e-05, "1": 0}, "score": 4.63665675926664}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7176544809952907, "5": 0.2810375187156975, "3": 0.0012036556235028712, "2": 0.0001035436805490433, "1": 0}, "score": 4.2796269997081176}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7879208408061827, "4": 0.21206600678731208, "3": 1.0574046527299204e-05, "2": 2.114942357446174e-06, "1": 0}, "score": 4.787906402004651}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7057637423909003, "4": 0.29420611083717746, "3": 2.7838252329203634e-05, "2": 2.016596234985696e-06, "1": 0}, "score": 4.705732076965779}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8509467123962986, "5": 0.14787236144312568, "3": 0.0007639328999082676, "2": 0.000415343113420844, "1": 0}, "score": 4.146277983696588}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6076113064842882, "5": 0.39230334467250694, "3": 5.9318193181517675e-05, "2": 2.5512436979822633e-05, "1": 0}, "score": 4.392193204845}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9690496451682403, "5": 0.027063630511363172, "3": 0.002943033873332685, "2": 0.0009406501244547147, "1": 8.712690586904015e-07}, "score": 4.022236730814605}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7718313896506203, "4": 0.22815293667643055, "2": 8.999297853043383e-06, "3": 5.8103833977031535e-06, "1": 0}, "score": 4.771808247507434}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5926416575952866, "5": 0.4073162574301508, "3": 2.8641151805729475e-05, "2": 1.2709434071416318e-05, "1": 0}, "score": 4.407262496499174}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9849132605922714, "5": 0.013616791209956887, "2": 0.0007803042891972565, "3": 0.0006886161182900533, "1": 6.478692083062111e-07}, "score": 4.0113656272236895}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9850877977605821, "2": 0.008390545858596539, "3": 0.006138654485542747, "5": 0.0003803572177882328, "1": 1.875005434773938e-06}, "score": 3.977454968646467}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9631583525442611, "5": 0.03096067896831346, "3": 0.0035283935380223965, "2": 0.002350416811401093, "1": 1.3204499608768981e-06}, "score": 4.0227275094961685}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5698208874948972, "4": 0.43012337192167116, "3": 4.2652144667654684e-05, "2": 1.2412481736173834e-05, "1": 0}, "score": 4.5697537955158385}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9783276603744232, "5": 0.02030454147449717, "3": 0.0009646109485898764, "2": 0.0004021096682331777, "1": 4.422962192676622e-07}, "score": 4.0185343960745366}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7815375200283979, "5": 0.21702513557648553, "3": 0.0010369288121184939, "2": 0.0003997716695358285, "1": 2.883784952566698e-07}, "score": 4.215187874796623}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9353669423231088, "5": 0.04109715834066674, "3": 0.02132092487493364, "2": 0.0022123692032606627, "1": 1.725590926597255e-06}, "score": 4.015346331786096}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8997620945414789, "5": 0.09483421662306636, "3": 0.0051855742046962045, "2": 0.00021740469225509264, "1": 1.6694106349863414e-07}, "score": 4.089213380653307}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7923532530735449, "5": 0.20669770818396102, "3": 0.0008060433764260132, "2": 0.0001422751072007082, "1": 1.5895844835177792e-07}, "score": 4.205606753124945}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8392371705856935, "5": 0.1601712057325738, "3": 0.0005342551628914068, "2": 5.71968632139036e-05, "1": 7.128984115300192e-08}, "score": 4.159522358984318}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9831115845345156, "3": 0.011994793480150158, "2": 0.00455271008616265, "5": 0.0003402660997971151, "1": 2.9148333575827675e-07}, "score": 3.9792391706414194}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9722714353798125, "5": 0.02758121648732372, "3": 0.00013178088193778118, "2": 1.5018241435612584e-05, "1": 0}, "score": 4.027419414176033}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8507385537471559, "5": 0.14783619628669561, "3": 0.0011645730963751944, "2": 0.00025985130354334694, "1": 0}, "score": 4.1461520412414234}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6370210362594959, "4": 0.3629636817493216, "3": 1.3876302900522524e-05, "2": 1.1390363044941942e-06, "1": 0}, "score": 4.637005051742643}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5620758914713694, "5": 0.43774514442346046, "3": 9.630474184786812e-05, "2": 8.237381093712159e-05, "1": 4.7005886424694724e-08}, "score": 4.43748405540237}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5386113638283383, "5": 0.4606987132852473, "3": 0.0005924399738766562, "2": 9.521376845464071e-05, "1": 0}, "score": 4.459916889392149}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6368994596573372, "4": 0.3628943623063251, "3": 0.00012173755729904947, "2": 8.366891795783836e-05, "1": 2.541050684867658e-07}, "score": 4.636609951366563}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.782248808190736, "5": 0.21722263144731108, "3": 0.000412837047901754, "2": 0.00011464066198421247, "1": 0}, "score": 4.2165807475570345}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7185773316194805, "4": 0.2813989121946427, "3": 2.13949210118489e-05, "2": 1.8119498995150314e-06, "1": 0}, "score": 4.718552707510425}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6790396896764641, "5": 0.32075563738679974, "3": 0.00018303649477598396, "2": 2.085952248651533e-05, "1": 0}, "score": 4.320531130873928}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7977891894929848, "2": 0.18949153985896003, "3": 0.012113791282706905, "5": 0.0005845544060689213, "1": 1.969223819721798e-05}, "score": 3.609428125224666}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9917167428042324, "3": 0.005369244872475385, "5": 0.002657968951262245, "2": 0.00025507753505071845, "1": 2.4760205413178706e-07}, "score": 3.996777823888244}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9607215156616098, "5": 0.031862650049784225, "3": 0.0063729328458221384, "2": 0.0010403526882508984, "1": 1.8286254382266723e-06}, "score": 4.023403542804717}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8396499669523172, "5": 0.16025001332981312, "3": 8.590487315709538e-05, "2": 1.380616950673193e-05, "1": 0}, "score": 4.160136545547823}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9136736209275957, "2": 0.07269141423300499, "3": 0.011866547167469864, "5": 0.0017364595153291581, "1": 2.7632125354508924e-05}, "score": 3.8444035143905277}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9731347297356797, "2": 0.012638815564427145, "3": 0.008160232644966292, "5": 0.006064169980195809, "1": 1.313443819944122e-06}, "score": 3.9726223456529337}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8591814545636498, "5": 0.14025752245148118, "3": 0.0004128606628562751, "2": 0.00014721006170961346, "1": 0}, "score": 4.139550374553488}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.97587984478414, "5": 0.020253742250695227, "3": 0.0033583986865229815, "2": 0.0005070423638369742, "1": 2.8485344984493927e-07}, "score": 4.015880415186968}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8668958121094441, "5": 0.1329427625709187, "3": 0.00011567662214170356, "2": 4.529961610565711e-05, "1": 0}, "score": 4.132736546326078}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7488838806452915, "5": 0.25084468907303437, "3": 0.0001753816678038694, "2": 9.53533588504256e-05, "1": 0}, "score": 4.250478774834155}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9558013599496036, "5": 0.025471247805629687, "2": 0.013214309282237309, "3": 0.005508543656049905, "1": 2.952952620093052e-06}, "score": 3.993525216455947}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8848411921274323, "5": 0.11249494406410146, "3": 0.0024088712552770993, "2": 0.00025389316237557126, "1": 5.467785287319988e-07}, "score": 4.109576706701921}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7597011854922335, "5": 0.2390505842174053, "3": 0.001160151127525852, "2": 8.670881559936518e-05, "1": 0}, "score": 4.237717341213982}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7057009392699313, "5": 0.2941799276584817, "3": 9.41671653789751e-05, "2": 2.456497279043715e-05, "1": 0}, "score": 4.29403674843668}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6385097585954158, "2": 0.2661704728759313, "3": 0.09490599534182856, "5": 0.0003878591111019887, "1": 2.0237100089914875e-05}, "score": 3.373076647688547}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9896673355692193, "2": 0.004044543864887964, "3": 0.003459481695921823, "5": 0.0028235466695975754, "1": 4.3118823890338395e-06}, "score": 3.9912620347783414}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8990506191799853, "5": 0.10087067784014322, "3": 7.276387124889499e-05, "2": 5.7890578489984585e-06, "1": 0}, "score": 4.100786350976267}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9576404161103363, "5": 0.04207578003166956, "3": 0.0002463129933666611, "2": 3.718769987064732e-05, "1": 0}, "score": 4.041755104297238}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9860788687383195, "5": 0.009667176477526133, "3": 0.0034469379250781584, "2": 0.0008060264496928393, "1": 3.582108705748981e-07}, "score": 4.004607113933061}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9761788582058373, "5": 0.019032458790569314, "3": 0.0039894200879873375, "2": 0.0007979342160021797, "1": 7.867463030719265e-07}, "score": 4.013444817318131}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8494098795163143, "4": 0.1186041857546978, "3": 0.031921883539874796, "1": 3.622670514209645e-05, "5": 2.5290316058246835e-05}, "score": 2.2691705814157532}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9879576692903104, "3": 0.006976272713741677, "2": 0.004870223255109978, "5": 0.00019181283098892776, "1": 2.0978123380768667e-06}, "score": 3.9834687683623113}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9722248996935304, "2": 0.012048766372649001, "3": 0.012048766372649001, "5": 0.0036746661278831993, "1": 2.0324004008438557e-06}, "score": 3.9675222415844935}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.95990887970415, "5": 0.03962016789849459, "3": 0.00033223566716739696, "2": 0.0001384964312246378, "1": 0}, "score": 4.03901094796295}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9804461655034438, "5": 0.014887286281060995, "3": 0.0031205447282887035, "2": 0.001544781658466719, "1": 8.28107384123407e-07}, "score": 4.0086746973291}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9755784069333112, "5": 0.015283598791057148, "3": 0.006079395574710264, "2": 0.0030569120699411173, "1": 8.239961330075118e-07}, "score": 4.003087909751804}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9042778171019287, "5": 0.0953101850953071, "3": 0.00037752679940260985, "2": 3.350744181741838e-05, "1": 0}, "score": 4.094865734821243}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9699149904854455, "5": 0.02281021082663832, "3": 0.006044105979880167, "2": 0.0012279346098288775, "1": 1.9651892634576773e-06}, "score": 4.014304351401358}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.58507700964226, "5": 0.41488172473931184, "3": 3.410686071238502e-05, "2": 6.821801305102083e-06, "1": 0}, "score": 4.414834114057004}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9313520932143883, "5": 0.06746691833378803, "3": 0.000947443740075134, "2": 0.00023218107384761022, "1": 0}, "score": 4.066055202521396}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt4", "target_model": "human", "scores": {"4": 0.46457281642013365, "2": 0.40998407151576977, "3": 0.12503809851478734, "5": 0.0002822021217415335, "1": 0.00011949189657259238}, "score": 3.054914347644581}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.644013448713716, "5": 0.35565799432034634, "3": 0.0002907167885258859, "2": 3.638747266908732e-05, "1": 0}, "score": 4.355295018725242}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8392689866699005, "5": 0.16017727633630824, "3": 0.0004864633466893559, "2": 6.687241551497137e-05, "1": 0}, "score": 4.15955713217795}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8915224363766001, "5": 0.10647715754318951, "3": 0.0014492631849660949, "2": 0.0005500782594229999, "1": 0}, "score": 4.1039278484846875}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9142921131101056, "5": 0.08504242749706194, "3": 0.00038170774790657067, "2": 0.0002836611970754712, "1": 0}, "score": 4.084093404961072}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6723379453514527, "5": 0.31758997975394027, "2": 0.007353205046911415, "3": 0.0027050929634768006, "1": 1.2724325535964783e-05}, "score": 4.300140619635648}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6001656011084963, "4": 0.3997964805424428, "3": 2.089135752635543e-05, "2": 1.6270205600950295e-05, "1": 0}, "score": 4.60011262349656}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8897602949936446, "5": 0.10963997889951563, "3": 0.000322735324322327, "2": 0.000276050151616148, "1": 2.1531193496442268e-07}, "score": 4.108764576225166}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6513403775723756, "4": 0.348637387924236, "3": 1.3538501076075273e-05, "2": 8.084208233772598e-06, "1": 0}, "score": 4.651311069123088}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6001357496139099, "4": 0.3997765951600542, "3": 5.17040729028817e-05, "2": 3.553565497597741e-05, "1": 0}, "score": 4.600013223535444}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5621612547977216, "5": 0.43781162544886915, "3": 2.435332907796002e-05, "2": 2.566822000316889e-06, "1": 0}, "score": 4.437782225858143}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9932805421993116, "5": 0.005051894285449213, "3": 0.0008917123098460292, "2": 0.0007747330806491476, "1": 4.5612793845328744e-07}, "score": 4.00260934915787}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9452390552131512, "5": 0.05332674453589911, "3": 0.0012346814220911121, "2": 0.00019843142172967454, "1": 0}, "score": 4.051695256484138}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7122305028533965, "4": 0.28776713066453774, "3": 1.5361534897632563e-06, "2": 6.304361219479434e-07, "1": 0}, "score": 4.712227848196635}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5077965772930647, "5": 0.49217331906577394, "3": 1.9413361341822825e-05, "2": 1.0230122535681428e-05, "1": 0}, "score": 4.492133671918255}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9226692048455967, "3": 0.050451923805287305, "2": 0.025768321250453575, "5": 0.0010973474723838278, "1": 9.493919660546815e-06}, "score": 3.8990799251242576}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6582866856934625, "5": 0.3415146165029871, "3": 0.00016410731243729574, "2": 3.3865458037294225e-05, "1": 0}, "score": 4.341283025715957}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.978965099714236, "5": 0.016844024738505457, "2": 0.0022094552213866503, "3": 0.001980542860270777, "1": 3.089739091566078e-07}, "score": 4.0104436504508625}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5774740919596898, "5": 0.4224890709894793, "3": 2.541067999676275e-05, "2": 1.110110394596304e-05, "1": 0}, "score": 4.422441595507855}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6925767615916297, "5": 0.3073290442480451, "3": 8.68167484863073e-05, "2": 6.907097858084545e-06, "1": 0}, "score": 4.307228557797728}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9796998036990399, "3": 0.010883480389141128, "5": 0.006705117755910185, "2": 0.0027091124688513007, "1": 1.203972562450121e-06}, "score": 3.990399788206649}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9787076500877391, "3": 0.00860082199049555, "2": 0.007709727004580414, "5": 0.00497777387966867, "1": 2.2824240498830567e-06}, "score": 3.9809506173740536}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9832658832245278, "5": 0.008776955372334876, "3": 0.006522479395151036, "2": 0.00143279857754233, "1": 8.568525387128314e-07}, "score": 3.99938630763448}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8220403150957339, "5": 0.1777786752183512, "3": 0.0001595998201226924, "2": 1.9976259789305624e-05, "1": 0}, "score": 4.177579377457511}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9852001238748729, "5": 0.010122084075606896, "3": 0.003609140224361316, "2": 0.0010668598125189621, "1": 5.047078953867743e-07}, "score": 4.004377715737976}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7929624343761988, "5": 0.20685661642537131, "3": 0.00014017709085952076, "2": 4.016140894115941e-05, "1": 0}, "score": 4.2066362427090995}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8029649217396083, "5": 0.19677500687799934, "3": 0.0002452594323783675, "2": 1.4054484944366755e-05, "1": 0}, "score": 4.196501787318971}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7661136286260396, "5": 0.23365145093261677, "3": 0.0002001536973101664, "2": 3.424226014368217e-05, "1": 1.1601457583312263e-07}, "score": 4.233382560000906}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.917295859745089, "4": 0.08269673150856183, "3": 5.377962354764217e-06, "2": 1.6401858489798391e-06, "1": 0}, "score": 4.9172875597018555}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9805619198885739, "3": 0.007256341520161414, "5": 0.007033087362051039, "2": 0.005145516633823648, "1": 2.148201666536535e-06}, "score": 3.9894792575916482}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8069464498315311, "2": 0.16914517654600295, "3": 0.01957997340802401, "5": 0.004168816901888873, "1": 0.00015666935382514192}, "score": 3.645827450296191}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9478901916774313, "5": 0.04574070853581207, "3": 0.004896956447558473, "2": 0.0014703329606442319, "1": 8.792988574044294e-07}, "score": 4.037900483558762}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8977198907563011, "5": 0.06014347627797023, "2": 0.024300161076379775, "3": 0.017778377629400283, "1": 5.4843767816764816e-05}, "score": 3.9936002243899402}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6075427292663534, "5": 0.392259079660573, "3": 0.00016376419502998757, "2": 3.3794651758241305e-05, "1": 1.402859496358556e-07}, "score": 4.392027498158316}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.968466890587288, "2": 0.013181828850657976, "3": 0.011100212796408432, "5": 0.007166836035037135, "1": 7.838201950182712e-05}, "score": 3.9694676408733267}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9044376134923751, "2": 0.08412579843561471, "3": 0.009738268005344112, "5": 0.0016922572336659466, "1": 4.4652203247696705e-06}, "score": 3.823688715018974}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9805089621499528, "5": 0.019116879323080677, "3": 0.00029948866126706795, "2": 7.454862208670962e-05, "1": 0}, "score": 4.018668295681051}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9436931534387277, "2": 0.029401655402945526, "3": 0.015016896177085636, "5": 0.011879342638953636, "1": 7.329677795423456e-06}, "score": 3.938037046077506}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9675380980732492, "5": 0.032088726817936966, "3": 0.0003145866509684137, "2": 5.819267908828769e-05, "1": 0}, "score": 4.031657767338264}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.973958518554119, "5": 0.022905310402496028, "2": 0.0018223348781940822, "3": 0.001312578573193585, "1": 6.209526536680139e-07}, "score": 4.0179462106402175}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt4", "target_model": "human", "scores": {"4": 0.984288287241213, "3": 0.010598040006588295, "2": 0.004281995241906958, "5": 0.00083010264180018, "1": 6.680104632396684e-07}, "score": 3.9816660514937197}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9844965620364639, "5": 0.013192259802176308, "3": 0.0019304541362277093, "2": 0.0003801289578694637, "1": 0}, "score": 4.01050155399934}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7927346331370471, "5": 0.20679717437604225, "3": 0.00030608705592084264, "2": 0.00016129654383500896, "1": 2.5813942268069863e-07}, "score": 4.2061678333606505}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7490408931195025, "5": 0.250897296720052, "3": 4.8711958675582056e-05, "2": 1.2707273651265085e-05, "1": 0}, "score": 4.250823268267942}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8631054200748752, "5": 0.136563100014913, "3": 0.00024381666208493435, "2": 8.693550813521437e-05, "1": 2.0243560519687658e-07}, "score": 4.136144876547243}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9412279033501597, "5": 0.051466714533754856, "3": 0.005865338988477977, "2": 0.0014373631353742206, "1": 1.352311780568268e-06}, "score": 4.042722649061212}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9325715790824145, "5": 0.06547679984006038, "3": 0.0017723757513215352, "2": 0.0001782525844066394, "1": 3.387735320022227e-07}, "score": 4.063346944026221}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9502188001108778, "2": 0.02003172524426331, "3": 0.017956322457864726, "5": 0.01177604377142173, "1": 1.3788329665502557e-05}, "score": 3.953714752165035}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7429993344687309, "5": 0.256773706866451, "3": 0.00016346118441522948, "2": 6.204286753372197e-05, "1": 3.927136957936545e-07}, "score": 4.25648525416736}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6652861500846392, "5": 0.3345268946850781, "3": 0.00016074954907221452, "2": 2.5434272052820668e-05, "1": 0}, "score": 4.334315534485966}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt4", "target_model": "human", "scores": {"4": 0.974854841091452, "2": 0.011894050046462153, "3": 0.011000198069804668, "5": 0.002234825790588432, "1": 1.2879907744600686e-05}, "score": 3.9674077834435098}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9522945755071783, "5": 0.047411958171487086, "3": 0.0002690116152302566, "2": 2.3876138186519214e-05, "1": 0}, "score": 4.047095221527668}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6924467494350316, "5": 0.30727139472703835, "3": 0.0002511653677781439, "2": 2.999742539954602e-05, "1": 0}, "score": 4.306960447245788}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6297634791554474, "4": 0.37021887284863625, "3": 1.4602964527982528e-05, "2": 2.9667721925631554e-06, "1": 0}, "score": 4.629742991929715}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9963637927713188, "5": 0.0017241553510198373, "3": 0.0016452005291095746, "2": 0.00026440778669115317, "1": 1.5722261704093062e-06}, "score": 3.999545422173927}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9661643100638827, "3": 0.013998621758981759, "5": 0.011605265052589612, "2": 0.008229365197615973, "1": 1.4776670964748453e-06}, "score": 3.9811434617899097}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7430213870162361, "5": 0.2567813331587948, "3": 0.00016346608832432032, "2": 3.3210150195075956e-05, "1": 0}, "score": 4.256551601621151}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6722956230099025, "4": 0.32765075801804805, "3": 3.9808384580877366e-05, "2": 1.3334138591228171e-05, "1": 0}, "score": 4.672229466631114}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6583989133902286, "4": 0.34157284970934054, "2": 1.4797253037431563e-05, "3": 1.2656761242552652e-05, "1": 0}, "score": 4.658357177541628}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9722636572394421, "5": 0.02673242315308724, "3": 0.0005905962134714578, "2": 0.00041230260502329006, "1": 2.142217807347e-07}, "score": 4.025316599483766}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6239620997733606, "2": 0.34458461563793175, "3": 0.031065245273634468, "5": 0.0002564594488509475, "1": 0.00012305058831910953}, "score": 3.279646687040801}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6369836824411542, "4": 0.3629423764065209, "3": 6.218560598698276e-05, "2": 1.1149264793888318e-05, "1": 0}, "score": 4.636899584446043}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6150413178108798, "4": 0.3848830103856935, "3": 6.292506399116423e-05, "2": 1.2585804576927268e-05, "1": 0}, "score": 4.614953320105161}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6224358426318244, "5": 0.37752642981079787, "3": 2.9614720679607e-05, "2": 7.970693939550879e-06, "1": 0}, "score": 4.37748092735842}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5389532750767885, "5": 0.460991165473963, "3": 4.643296028231013e-05, "2": 8.861885549666037e-06, "1": 0}, "score": 4.460927130705475}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt4", "target_model": "human", "scores": {"5": 0.6583907492943201, "4": 0.3415686142322642, "3": 3.2319784242463945e-05, "2": 7.920303754757265e-06, "1": 0}, "score": 4.658342849860075}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9148508613971491, "4": 0.08509437876924075, "3": 4.4212898066059143e-05, "2": 1.0020585809445427e-05, "1": 0}, "score": 4.914787088825404}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5697836224274361, "4": 0.43009524277298067, "3": 0.00010890887876389067, "2": 1.2029795828304169e-05, "1": 0}, "score": 4.569650765679768}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9324507069882235, "4": 0.06754650198517788, "3": 1.8599908306674473e-06, "2": 6.736440373781576e-07, "1": 0}, "score": 4.9324477397136555}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6297674844639116, "4": 0.37022120523488217, "3": 9.138365662770272e-06, "2": 2.0711552801868e-06, "1": 0}, "score": 4.62975426725449}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8701903309965917, "5": 0.12934224833206498, "3": 0.00038073068359146454, "2": 8.629033147884451e-05, "1": 0}, "score": 4.128788988456843}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8627239168770094, "5": 0.13650275246249796, "3": 0.0005323093780298645, "2": 0.00023993080228693967, "1": 4.1518775389593253e-07}, "score": 4.135489427411617}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.940804937178733, "5": 0.04198703495086137, "3": 0.010129843601316593, "2": 0.007071770543112671, "1": 4.717908363075875e-06}, "score": 4.017699526553399}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8518113899139077, "5": 0.14802263170247584, "3": 0.00013082630900303658, "2": 3.4665520865290976e-05, "1": 0}, "score": 4.147822546275356}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9782584128801475, "5": 0.020947593666470365, "3": 0.000549580004297805, "2": 0.00024387469735643382, "1": 0}, "score": 4.019910274994155}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9782061606025636, "5": 0.016570030613826826, "3": 0.0044597632380422875, "2": 0.0007629755284491448, "1": 4.422413779367052e-07}, "score": 4.010582996238501}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8265115394430096, "5": 0.17324623027903854, "3": 0.00020604499308280914, "2": 3.525014201217245e-05, "1": 0}, "score": 4.172969846753449}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9535949179654569, "5": 0.04601599157371447, "3": 0.0003458894647455583, "2": 4.262195763669994e-05, "1": 0}, "score": 4.045584884589096}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7490776120040558, "4": 0.2509095658978406, "3": 8.07762228819943e-06, "2": 3.8155985946207525e-06, "1": 0}, "score": 4.749062598971763}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.904014309158571, "5": 0.09528239669707866, "3": 0.0005158678138553442, "2": 0.00018683494087670056, "1": 0}, "score": 4.09439291482446}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8093029802369405, "3": 0.10615744040265833, "2": 0.0826754977144463, "5": 0.0018553040277334764, "1": 7.822886139107998e-06}, "score": 3.7303231420686176}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9513395509005942, "5": 0.04736440413569008, "3": 0.0011139040190844658, "2": 0.00018183988697192537, "1": 0}, "score": 4.045886834157244}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.872993629866674, "5": 0.12576665920618596, "3": 0.0011052298020258749, "2": 0.00013407958719922094, "1": 0}, "score": 4.124393320178395}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5774233919601782, "5": 0.42245197807744905, "3": 0.00010865813289397325, "2": 1.5172074860920673e-05, "1": 0}, "score": 4.4223133135418555}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9856259868721463, "5": 0.008010693038373649, "3": 0.005012963609265047, "2": 0.0013492208517459586, "1": 0}, "score": 4.000299288065497}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9892776298579952, "5": 0.008040369010629695, "3": 0.00155869663082569, "2": 0.0011226870671313238, "1": 2.1126448605895717e-07}, "score": 4.00423566617248}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6222504466104128, "5": 0.3774139814373741, "3": 0.0002478868911276524, "2": 8.70164827811371e-05, "1": 0}, "score": 4.376992313629566}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8807731303495363, "4": 0.11919966914308497, "3": 2.3142726890298952e-05, "2": 3.837440308347303e-06, "1": 0}, "score": 4.880742506804991}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6791521207942781, "4": 0.3208087268378182, "3": 2.2913483993823053e-05, "2": 1.5996189825333635e-05, "1": 0}, "score": 4.679097379743551}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5850855810832368, "5": 0.414887802801101, "3": 2.3810783301537864e-05, "2": 2.7135657853798778e-06, "1": 0}, "score": 4.414858602956383}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9577371809864593, "3": 0.02435405289444481, "5": 0.010474547627765307, "2": 0.007427566481083365, "1": 5.615072825752529e-06}, "score": 3.9712484867391566}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9958300009922625, "3": 0.001805931958402918, "5": 0.0016965160722760238, "2": 0.0006643652396509139, "1": 2.1145278693652715e-06}, "score": 3.99855550850361}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9705437311068073, "5": 0.025068354629971246, "3": 0.0031376737423801926, "2": 0.001248080385064291, "1": 1.2696440149182992e-06}, "score": 4.019430728488321}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8932565851334985, "5": 0.10668428645313031, "3": 4.9687508225752526e-05, "2": 8.908479339630182e-06, "1": 0}, "score": 4.1066168387517825}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9576499351033818, "5": 0.040781652187693064, "3": 0.0010209486856249464, "2": 0.0005464744519121943, "1": 5.917698763596417e-07}, "score": 4.038665994670006}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9608393745986661, "3": 0.024054143749387684, "2": 0.010508477149258044, "5": 0.004590813672147008, "1": 4.743676926900786e-06}, "score": 3.95950538549692}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9733836067025247, "3": 0.011156566842023957, "5": 0.011156566842023957, "2": 0.004301239680679557, "1": 1.1962103978174588e-06}, "score": 3.991393924918431}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9224015681065032, "5": 0.07571533977739132, "3": 0.0015470583344340113, "2": 0.0003345751633669352, "1": 5.69988871495791e-07}, "score": 4.073497486461639}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9016338198816162, "5": 0.09804812004063851, "3": 0.0002797338339306506, "2": 3.7857857645868183e-05, "1": 0}, "score": 4.097692716249333}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6456720026351078, "2": 0.23752946501062788, "3": 0.11576259266626866, "1": 0.001001542667671565, "5": 1.544710424029389e-05}, "score": 3.406178043537458}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8759792460939244, "5": 0.1223140942102126, "3": 0.0014691988893127852, "2": 0.00023612174908705071, "1": 6.736615523508231e-07}, "score": 4.120370710932248}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7430682880063643, "5": 0.25679753657212945, "3": 0.00011960181990099631, "2": 1.3418952293465952e-05, "1": 0}, "score": 4.256651393189996}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.531118616206476, "5": 0.4687105337072316, "3": 0.00013660800647367867, "2": 3.3477231731695984e-05, "1": 2.4773777724218663e-07}, "score": 4.468506470293489}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8438878773101652, "4": 0.15610355154342442, "3": 5.34961479811952e-06, "2": 2.689955250475135e-06, "1": 0}, "score": 4.843877596370249}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5467248606987251, "5": 0.45325082915236625, "3": 1.84456128806409e-05, "2": 5.3679793777666e-06, "1": 0}, "score": 4.453221872631065}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5620319669568237, "5": 0.43771093597713623, "3": 0.00023833769581190468, "2": 1.809369541469458e-05, "1": 0}, "score": 4.43743670208109}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.78771597650835, "5": 0.2120108767927572, "3": 0.0001903315512461792, "2": 8.186058013569102e-05, "1": 0}, "score": 4.211657026122161}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9099441363335972, "5": 0.08732469334039646, "3": 0.002438804545758216, "2": 0.00029127375330438544, "1": 0}, "score": 4.08430343334965}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7247783028956019, "5": 0.27509483120885564, "3": 9.228397962931628e-05, "2": 3.3423042521402186e-05, "1": 0}, "score": 4.274936019760221}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6370041681657903, "5": 0.3629540270437952, "3": 3.1762347836327184e-05, "2": 9.686968783886788e-06, "1": 0}, "score": 4.362903019760905}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9129835007665692, "2": 0.07263651660974035, "3": 0.012622336454245379, "5": 0.0017351484626386064, "1": 2.051892350105628e-05}, "score": 3.843777912888752}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6722742577944982, "4": 0.3276403061255758, "3": 6.666443204307559e-05, "2": 1.7942488474498604e-05, "1": 0}, "score": 4.6721722657234634}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9664777759105895, "5": 0.027416863464336957, "2": 0.00388853810682286, "3": 0.0022156222265793646, "1": 5.270491652827009e-07}, "score": 4.017422595606248}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5543885412838322, "5": 0.445463707516109, "3": 0.00010763496602155861, "2": 3.959669115051816e-05, "1": 0}, "score": 4.445277110508343}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8833353779608476, "5": 0.1158683785234563, "3": 0.000437941595537743, "2": 0.0003574375129709563, "1": 0}, "score": 4.114715661063019}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8712198090161837, "5": 0.12551110980320737, "2": 0.001735237478037965, "3": 0.001531341699617209, "1": 1.9086564361576506e-06}, "score": 4.120503638678621}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8435263741235398, "5": 0.1560366911044718, "3": 0.00035770962644437185, "2": 7.857837685523667e-05, "1": 2.662276678660629e-07}, "score": 4.155521085223466}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7971503285285109, "5": 0.20155116686076957, "3": 0.0009480654670727827, "2": 0.00034877379422067775, "1": 7.167154048770393e-07}, "score": 4.19990359329439}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7718092461257016, "4": 0.22814638878111068, "3": 2.950670595333045e-05, "2": 1.4380419983687284e-05, "1": 0}, "score": 4.771751347451651}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9393691087045811, "5": 0.060051863407802525, "3": 0.0004805055880331548, "2": 9.762060207372133e-05, "1": 0}, "score": 4.059376170154967}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9365549433489389, "2": 0.036314179287514375, "3": 0.026986406573424694, "5": 0.00013303184796827842, "1": 8.114994782038167e-06}, "score": 3.900493590961102}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9827338168746812, "5": 0.015884412444742077, "3": 0.001115260800084111, "2": 0.00026489765874103405, "1": 9.40558489825779e-07}, "score": 4.01423654421387}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9672332139102734, "5": 0.03207861404510067, "3": 0.0005606348811874774, "2": 0.00012706446523697378, "1": 0}, "score": 4.031263865011811}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.798132432330506, "5": 0.20179946948113578, "3": 6.260871952633773e-05, "2": 5.059560176920554e-06, "1": 0}, "score": 4.2017268283653655}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9930744131804444, "5": 0.006092480336274215, "3": 0.0006729597748612289, "2": 0.00015984211678537092, "1": 1.2273982079794615e-07}, "score": 4.005099469035728}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9726941979656326, "5": 0.02512390237812409, "3": 0.0016831965249040183, "2": 0.0004975519423907804, "1": 3.267942725405021e-07}, "score": 4.022444640088861}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9340254058491045, "5": 0.059710248897070176, "2": 0.003757969101816688, "3": 0.0025033471063963114, "1": 1.406365276434462e-06}, "score": 4.049686825117045}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8391854583845113, "5": 0.1601613555063188, "3": 0.0004292596832108537, "2": 0.00022269698994054467, "1": 4.576329011953974e-07}, "score": 4.15928545188153}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7825217198157584, "5": 0.21729845537619213, "3": 0.00015921835435896216, "2": 1.99285137505498e-05, "1": 0}, "score": 4.217099527174772}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.987237840921609, "5": 0.007656356968031561, "3": 0.0037314103756436816, "2": 0.0013727091637731194, "1": 6.493986864454449e-07}, "score": 4.001177581285426}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9904605331683238, "5": 0.004882561008260777, "3": 0.002613446580112785, "2": 0.002035354243107122, "1": 4.248434482274404e-06}, "score": 3.998185653641341}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8632480686633249, "5": 0.13658567576117947, "3": 0.00014790683139957224, "2": 1.766495190097616e-05, "1": 0}, "score": 4.136402532296964}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8927262375498912, "5": 0.10662094546637359, "3": 0.000478561753008037, "2": 0.0001733236330146394, "1": 2.0294110969832966e-07}, "score": 4.105795204712382}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7185924722033632, "4": 0.2814048497743312, "3": 1.729010981368809e-06, "2": 7.793263065703123e-07, "1": 0}, "score": 4.718589306473609}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.944956140249383, "5": 0.05500304124031165, "3": 3.1386992577473075e-05, "2": 9.134135578808415e-06, "1": 0}, "score": 4.054953402318738}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6369324837504625, "5": 0.36291319701248514, "3": 0.00010913040660159771, "2": 4.409267010927658e-05, "1": 0}, "score": 4.362716278860865}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8126251466442926, "5": 0.18707694054197946, "3": 0.0002443619573760859, "2": 5.284697947881703e-05, "1": 0}, "score": 4.186727016058473}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9692080735081678, "5": 0.030196598300556144, "3": 0.0005115062774594014, "2": 8.350107933694906e-05, "1": 0}, "score": 4.0295180993348465}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8395515573470983, "5": 0.16023121710566962, "3": 0.00017902000474787576, "2": 3.752463152299835e-05, "1": 0}, "score": 4.159977256768144}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8175398428231568, "5": 0.1824178033535651, "3": 3.654080414515504e-05, "2": 5.43130565936972e-06, "1": 0}, "score": 4.182370469551367}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7309092002585776, "5": 0.2688864520050037, "3": 0.00017117211280828898, "2": 3.266876942109347e-05, "1": 1.536688307108507e-07}, "score": 4.268649576229957}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9297077960509329, "5": 0.06948565156692886, "3": 0.0005223043991017771, "2": 0.0002795693987849703, "1": 3.519259358536961e-06}, "score": 4.068393729882736}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8557685884369884, "5": 0.14413494502473007, "3": 7.848288362063418e-05, "2": 1.778767066384668e-05, "1": 0}, "score": 4.1440209150255765}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8175384938835291, "5": 0.18241749324356302, "3": 2.9823705324263444e-05, "2": 1.3869311005966102e-05, "1": 0}, "score": 4.18235998924527}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9855819771903459, "5": 0.013206805685788133, "3": 0.0009870666430396872, "2": 0.0002237126817934927, "1": 0}, "score": 4.011772318833072}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6086284049494715, "2": 0.26176783343382487, "3": 0.1275754276362121, "5": 0.0018197666507266362, "1": 0.0002041719555120912}, "score": 3.350093299697151}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8768538483863296, "5": 0.12243622460916662, "3": 0.000558201806819322, "2": 0.00015023797815945364, "1": 0}, "score": 4.121577727658799}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9776619979995839, "5": 0.012306951667945275, "3": 0.007822774437054054, "2": 0.002206514848150392, "1": 8.790122526960218e-07}, "score": 4.000068510558261}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6512241367154292, "5": 0.3485751617043468, "3": 0.00017013777635560036, "2": 2.9565512327202576e-05, "1": 0}, "score": 4.348346240654442}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9155849667988671, "5": 0.08000291559778859, "2": 0.003053957464751328, "3": 0.0013551854100854362, "1": 1.4223615561579928e-06}, "score": 4.072535660775495}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7309766443619714, "5": 0.26891127136991994, "3": 9.753990320938619e-05, "2": 1.405195536474576e-05, "1": 0}, "score": 4.268785759908652}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6722279262492545, "4": 0.3276177324861546, "3": 0.00012260619568160768, "2": 3.004594042857725e-05, "1": 4.4915041738235173e-07}, "score": 4.672044714042166}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7660198007749405, "5": 0.2336228537452062, "3": 0.00030516071063981133, "2": 5.1397449878124224e-05, "1": 2.9621745709479863e-07}, "score": 4.233214124014332}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6442174658419485, "4": 0.35577064904508165, "3": 8.511486106619974e-06, "2": 2.763274965400488e-06, "1": 0}, "score": 4.644203820996936}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6991246964682251, "5": 0.30068980313148147, "3": 0.00016372849832655304, "2": 2.114354288566463e-05, "1": 0}, "score": 4.300483976359219}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9662378669527153, "5": 0.01742289731857284, "3": 0.009927267649173259, "2": 0.006409525729143998, "1": 1.2251209305789615e-06}, "score": 3.994672896364012}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7974835352426657, "5": 0.20163543285888402, "3": 0.0007048369912303592, "2": 0.00017544771143373068, "1": 2.4016983933130477e-07}, "score": 4.200579081634067}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6652911264436534, "4": 0.3345294036461968, "3": 0.00015101128331509761, "2": 2.7074831189991972e-05, "1": 0}, "score": 4.665086885842294}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6654054199697439, "4": 0.3345868472761974, "3": 5.676169139750988e-06, "2": 1.5762152435462507e-06, "1": 0}, "score": 4.665396911006615}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5389509360246504, "4": 0.4609891647766463, "3": 3.789728819571791e-05, "2": 2.1593223917798015e-05, "1": 0}, "score": 4.538870072517592}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8684078946411804, "2": 0.07354603811050711, "3": 0.05380743092875235, "5": 0.004214523679347456, "1": 2.2115783916425213e-05}, "score": 3.803248276292913}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8974297541853379, "5": 0.10068884096957981, "3": 0.0014818401780427998, "2": 0.00039883187332042335, "1": 4.057230714899819e-07}, "score": 4.0984081520621}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7234725023933734, "2": 0.20090104612141846, "5": 0.05407178301945315, "3": 0.021508269282592155, "1": 4.489464658756955e-05}, "score": 3.6306261818178425}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8860566600737123, "5": 0.11264947190974033, "3": 0.0011043763416953047, "2": 0.00018893642030549493, "1": 0}, "score": 4.111167284453574}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9271010006837257, "3": 0.03767277100458185, "4": 0.03484161755415338, "1": 0.0003693308511724313, "5": 9.10266800545376e-06}, "score": 2.1070146443206985}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8680687520740058, "4": 0.1103625636520798, "3": 0.021063063868987632, "1": 0.0004653436933089406, "5": 3.6448545656139874e-05}, "score": 2.2414331173628486}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9970434365675167, "3": 0.0015225998159057368, "2": 0.0012234433227750678, "5": 0.0002093064734377348, "1": 0}, "score": 3.996239815447793}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9754455597606003, "5": 0.014355659848612767, "3": 0.006271523320613256, "2": 0.003924619009902063, "1": 1.5880781238028969e-06}, "score": 4.000230134515462}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9696110211830445, "5": 0.03020915665683086, "3": 0.00014433695883444824, "2": 3.482291189634567e-05, "1": 0}, "score": 4.029995193739702}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9747065691482435, "5": 0.025175882156959303, "3": 9.079839034428568e-05, "2": 2.6423838018094223e-05, "1": 0}, "score": 4.025032244262766}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9891282038332694, "3": 0.005439563284072139, "5": 0.003197754289735806, "2": 0.0022323922737885805, "1": 1.466244775729365e-06}, "score": 3.9932890035624427}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9864364689987533, "5": 0.009977666835585248, "3": 0.002191802531387956, "2": 0.0013931944543400239, "1": 0}, "score": 4.004999479730966}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9637144942773592, "5": 0.03402328621903932, "3": 0.0019803929388508518, "2": 0.00028087916469336094, "1": 2.769410968839257e-07}, "score": 4.031480325233778}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9171886478843739, "5": 0.08268707309438401, "3": 9.834124853064614e-05, "2": 2.5653847438337663e-05, "1": 0}, "score": 4.082537447585444}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9126309016052795, "2": 0.06611076407977443, "3": 0.02080267489129868, "5": 0.00045246551847184487, "1": 2.527451689957585e-06}, "score": 3.847420578425467}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt4", "target_model": "human", "scores": {"4": 0.4964865179722654, "2": 0.42466742321870987, "3": 0.07855557051424598, "5": 0.00021054229471767152, "1": 7.745418172369011e-05}, "score": 3.0720854506033914}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5311834697487431, "5": 0.4687677667574039, "3": 3.620195264925993e-05, "2": 1.104097175171796e-05, "1": 0}, "score": 4.468710195567656}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5155624182117832, "5": 0.4843260703638534, "3": 9.403232047043916e-05, "2": 1.6859066072752425e-05, "1": 1.7321244327665305e-07}, "score": 4.484198016625868}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6925996654838494, "5": 0.3073392477416912, "3": 4.647119033813261e-05, "2": 1.417291229462231e-05, "1": 0}, "score": 4.307264566744131}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8665629446957599, "5": 0.13289174892878805, "3": 0.000299927133842983, "2": 0.0002447933922826103, "1": 1.9699332343020025e-07}, "score": 4.132101695398947}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9281652322980575, "5": 0.06723605786406538, "3": 0.003244495535256521, "2": 0.0013525069616649365, "1": 1.0066113168689546e-06}, "score": 4.061283571514743}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8074390553373624, "5": 0.19178358579339327, "3": 0.0007136358783539464, "2": 6.235678940164164e-05, "1": 0}, "score": 4.1909454972062585}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6653712389712665, "4": 0.334569683411189, "3": 4.8271945720462736e-05, "2": 9.961479034028434e-06, "1": 0}, "score": 4.665303605711985}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5234037103361313, "4": 0.47656450144580165, "3": 2.6508980383063703e-05, "2": 4.752798288540221e-06, "1": 0}, "score": 4.52336797128069}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9044211347891787, "5": 0.09532530248944086, "3": 0.00020529039915225466, "2": 4.800477849654508e-05, "1": 7.33088132461329e-08}, "score": 4.095023801063796}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt4", "target_model": "human", "scores": {"4": 0.898178680872871, "5": 0.0491127600070546, "2": 0.03375467340468266, "3": 0.018934655719923275, "1": 1.781424749081238e-05}, "score": 3.962615261807926}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9679364293704831, "5": 0.027032538741508665, "2": 0.0031292434904036763, "3": 0.0018979821186360056, "1": 1.5273688634926437e-06}, "score": 4.018871530541997}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8253472765051438, "5": 0.17300219442971154, "3": 0.001147607429422415, "2": 0.0005013525558859769, "1": 5.96267765380683e-07}, "score": 4.170850259290416}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9968426033937637, "5": 0.0022149235295194202, "3": 0.0006969566111515665, "2": 0.00023712763914695588, "1": 3.893169307666388e-06}, "score": 4.001032036771834}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9922263185683401, "2": 0.0037502641555526325, "3": 0.002498214505671697, "5": 0.001515243692228725, "1": 4.82268852565799e-06}, "score": 3.9915019891607795}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt4", "target_model": "human", "scores": {"4": 0.62230129899471, "5": 0.3774448174192902, "3": 0.00019919904639478689, "2": 5.4457988868473336e-05, "1": 8.852719889522004e-08}, "score": 4.377136488867274}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8694544525987979, "5": 0.1038415395459896, "2": 0.017765192742575573, "3": 0.008932899899707183, "1": 5.1777497876612615e-06}, "score": 4.05936276468962}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7807092949570268, "5": 0.2167951457758735, "3": 0.0021253848226273696, "2": 0.00036933650197768284, "1": 4.0624760447368885e-07}, "score": 4.213929961558947}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8311356420083232, "4": 0.16885544248633316, "3": 6.159826169832805e-06, "2": 2.527987566516763e-06, "1": 0}, "score": 4.831124615447119}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6992177142052458, "4": 0.30072979753486684, "3": 2.8014369023776746e-05, "2": 2.4339305599560647e-05, "1": 6.22461593931802e-08}, "score": 4.69914088506177}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5198334797196624, "4": 0.3055943225211334, "3": 0.1741223963078241, "1": 0.0003929819012321028, "5": 5.235982286236563e-05}, "score": 2.785078640154079}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9660958732727378, "5": 0.022021361928196637, "2": 0.009925808448082737, "3": 0.001954507569267913, "1": 1.5244642821732716e-06}, "score": 4.000210664264638}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9441771835598897, "5": 0.023637011772422042, "2": 0.021188080414965966, "3": 0.010992236808726399, "1": 4.049905542327127e-06}, "score": 3.9702564216595984}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.4999573420997726, "5": 0.4999573420997726, "3": 6.074304304980211e-05, "2": 2.3787317439773535e-05, "1": 0}, "score": 4.499849417023553}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9599697331365815, "2": 0.029445078399937458, "3": 0.005619691555194703, "5": 0.004959360390940133, "1": 2.8300151300952747e-06}, "score": 3.940440825057936}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9819379028638237, "5": 0.014006594843933188, "3": 0.0035971910570982172, "2": 0.00045733152154074565, "1": 0}, "score": 4.0094947500458895}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9893582563023577, "5": 0.00535647590791877, "3": 0.004581636638673103, "2": 0.0007026167348192232, "1": 0}, "score": 3.9993696051601244}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8431646716677696, "5": 0.15596978131748662, "3": 0.0008313430769433161, "2": 3.325790748630189e-05, "1": 0}, "score": 4.155072069128449}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7980677383376242, "5": 0.20178310420778167, "3": 0.00011514573166408679, "2": 3.350931828670083e-05, "1": 0}, "score": 4.201601041124843}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9723324074609829, "3": 0.01523274944704999, "2": 0.010801636808423009, "5": 0.0016308032404340907, "1": 0}, "score": 3.9647946955766735}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5962414181040889, "4": 0.29980902211118116, "3": 0.10361122558076988, "5": 0.0002489247290926119, "1": 8.738079817109857e-05}, "score": 2.703890091157664}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9546519100872667, "5": 0.04464966832583434, "3": 0.0004446230559684306, "2": 0.0002533385047686246, "1": 0}, "score": 4.0436983883627295}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8927570282088061, "2": 0.04958505505644023, "3": 0.04658084844034534, "5": 0.011063919062928184, "1": 1.0739677470652375e-05}, "score": 3.865280416863179}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9407976610214859, "5": 0.05649928476140758, "3": 0.002156751768552086, "2": 0.0005453122454118815, "1": 2.579750402298198e-07}, "score": 4.053251173568916}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9821213901925954, "3": 0.010574709763059518, "2": 0.004076913793337666, "5": 0.0032251042618537617, "1": 1.0989383286449617e-06}, "score": 3.9844932579545658}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9523591185068827, "5": 0.04741517281122617, "3": 0.0001937749739947569, "2": 3.114247235126984e-05, "1": 0}, "score": 4.047159150206524}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.94165378293711, "4": 0.05834581180187823, "3": 2.835881010426297e-07, "2": 9.351743008537972e-08, "1": 0}, "score": 4.9416533388268515}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8927262375498912, "5": 0.10662094546637359, "3": 0.000478561753008037, "2": 0.0001733236330146394, "1": 2.0294110969832966e-07}, "score": 4.105795204712382}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7057838287128358, "4": 0.29421449583082193, "3": 9.828385228780108e-07, "2": 3.615660865581284e-07, "1": 0}, "score": 4.705782356392612}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6584155118360577, "5": 0.3415814916117578, "3": 2.6119356059826055e-06, "2": 3.8221062727234505e-07, "1": 0}, "score": 4.341578116076717}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9069193113067031, "3": 0.05116488612952422, "2": 0.03984725338343272, "5": 0.002046852564613989, "1": 1.885086041036046e-05}, "score": 3.8711305403560434}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9253013969515888, "5": 0.07361652161309726, "3": 0.0006077414579928072, "2": 0.00047330952338975557, "1": 3.30921053195752e-07}, "score": 4.0720612187543574}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9537949612004706, "5": 0.033673082488486515, "3": 0.007751983754876764, "2": 0.004775858646303248, "1": 3.0881696155338784e-06}, "score": 4.016360133713404}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9851012048967449, "5": 0.011649278875324886, "3": 0.0019620586996781293, "2": 0.0012867495103034599, "1": 2.1037251431529095e-07}, "score": 4.007113093577296}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9941132492185208, "5": 0.004603658341193721, "3": 0.0010272150229392097, "2": 0.0002556940360376391, "1": 6.68023217681225e-08}, "score": 4.003064855196512}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.86417896172562, "3": 0.08691276191616747, "2": 0.041054681735540575, "5": 0.00783542155921, "1": 1.466055506018221e-05}, "score": 3.8387687481806543}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8384013962854, "2": 0.08432024403837676, "3": 0.07558417825806302, "5": 0.0016698725046313356, "1": 2.272867988220547e-05}, "score": 3.7573766367285657}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7384352563355806, "5": 0.2551964087262045, "3": 0.0056380236023536425, "2": 0.0007280821301432583, "1": 1.2999015852711826e-06}, "score": 4.248098551717818}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8962460807685394, "4": 0.10374802045553545, "3": 5.254556253090481e-06, "2": 4.811725015751764e-07, "1": 0}, "score": 4.89624000999668}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.8354634234016086, "4": 0.16451250391896666, "3": 2.0946918724554362e-05, "2": 2.879499683254107e-06, "1": 0}, "score": 4.8354369232190635}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt4", "target_model": "human", "scores": {"4": 0.835855916028065, "2": 0.11671164020226489, "3": 0.03970913567515233, "5": 0.007578621166728092, "1": 0.0001409931852943278}, "score": 3.7340222430778187}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5926606520647972, "4": 0.4073293121254018, "3": 7.4717374163999505e-06, "2": 2.278751164335674e-06, "1": 0}, "score": 4.592648791920328}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8422227592922933, "5": 0.15100222608365774, "3": 0.003780265627478047, "2": 0.002990436247644485, "1": 3.090010713217347e-06}, "score": 4.141231990618503}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.699229824760933, "5": 0.3007350002053672, "3": 2.396236699872967e-05, "2": 1.0800684999130694e-05, "1": 0}, "score": 4.300689560346967}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8080085086573217, "5": 0.1919188408931982, "3": 5.093007217131221e-05, "2": 2.12308127477054e-05, "1": 0}, "score": 4.19182554310652}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8737645615443966, "2": 0.11825116495863203, "3": 0.00755954406100691, "5": 0.0003944297922221641, "1": 2.12332119650991e-05}, "score": 3.7562666463862335}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7430827259634645, "5": 0.25680249281241285, "3": 8.888230314465226e-05, "2": 2.546520620692443e-05, "1": 0}, "score": 4.256662791415298}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6578831414562546, "5": 0.34130526393420496, "3": 0.0007466022334451389, "2": 6.422596434358058e-05, "1": 3.9402440024901737e-07}, "score": 4.340429154470383}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8518883715875788, "5": 0.1480359987496317, "3": 6.476961298547342e-05, "2": 1.0089159776097347e-05, "1": 0}, "score": 4.147951164871172}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8989396382314875, "5": 0.1008582210806507, "3": 0.00015891120036931386, "2": 4.2770369351572566e-05, "1": 0}, "score": 4.1006138153352065}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6434671771543443, "5": 0.3553563465043491, "3": 0.0009674140250560984, "2": 0.00020597412579506096, "1": 8.158706595492271e-07}, "score": 4.353975340960899}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8897707710930306, "5": 0.10964126169477308, "3": 0.000540486336811046, "2": 4.649494318473081e-05, "1": 0}, "score": 4.109007892945984}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8255235977682002, "5": 0.17303915164533182, "3": 0.001341975227489258, "2": 9.42215155119042e-05, "1": 0}, "score": 4.171508914130367}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5311947840771458, "4": 0.46877775161717417, "3": 2.374230689898002e-05, "2": 3.213171828864044e-06, "1": 0}, "score": 4.531164885697598}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9490650375517249, "5": 0.05029860177381924, "3": 0.0005331791894286873, "2": 0.00010175902904861405, "1": 0}, "score": 4.0495619750260206}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9169006362612286, "5": 0.08011788231093102, "3": 0.0021686921260933275, "2": 0.0008103810409379243, "1": 1.3805811834849452e-06}, "score": 4.076324364796406}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5465172540236348, "4": 0.45307871717358783, "3": 0.00034791081144102504, "2": 5.5047506004992874e-05, "1": 0}, "score": 4.546059832749225}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9151254127354972, "5": 0.07750258409634982, "3": 0.004877760882341974, "2": 0.002491316483473947, "1": 1.7418374433332145e-06}, "score": 4.067637044814617}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6150684970872355, "4": 0.38490003028872005, "3": 2.2437609758141184e-05, "2": 8.384322206543987e-06, "1": 0}, "score": 4.615029691028014}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7920896017849298, "2": 0.1767390903025225, "3": 0.026269915286865356, "5": 0.00478410650419044, "1": 0.00011428319766789857}, "score": 3.624692033998043}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt4", "target_model": "human", "scores": {"5": 0.5077215051189591, "4": 0.4921005566196464, "3": 0.00011524537581185703, "2": 6.168640448726248e-05, "1": 0}, "score": 4.507483397706618}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7371541720495685, "4": 0.26284041974332234, "3": 4.459013521130633e-06, "2": 7.510204163494001e-07, "1": 0}, "score": 4.737148357078244}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5544283145444338, "4": 0.4454956662288315, "3": 5.9445953663202794e-05, "2": 1.6507545146055128e-05, "1": 0}, "score": 4.554335889935826}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5389805198534495, "5": 0.46101446916637356, "3": 4.319154035501024e-06, "2": 5.078518833961458e-07, "1": 0}, "score": 4.461009219122401}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9775012444781496, "2": 0.015313727968979667, "3": 0.006383711569956126, "5": 0.0007990151908906072, "1": 1.1826463039061557e-06}, "score": 3.963784259249588}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt4", "target_model": "human", "scores": {"2": 0.4661583013847287, "4": 0.451816118229119, "3": 0.08100616630378539, "5": 0.0008453752046392493, "1": 0.00016908567818482462}, "score": 2.9870103315568786}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8589633618525494, "5": 0.14022191558701347, "3": 0.0005299891623624041, "2": 0.0002836827561456833, "1": 3.480989703666337e-07}, "score": 4.139123614355765}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9583167345867631, "5": 0.03715796982021621, "3": 0.0028653149633676776, "2": 0.0016583170768371687, "1": 7.143077107568897e-07}, "score": 4.030973907181871}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7825990211290907, "5": 0.2173199037921997, "2": 4.5621384182347125e-05, "3": 3.4979128602170164e-05, "1": 0}, "score": 4.217193784968003}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9067098235403415, "5": 0.09262624075407534, "3": 0.00037267344662220175, "2": 0.0002902383720592904, "1": 2.646631371927687e-07}, "score": 4.091672366173762}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9788557730389942, "5": 0.014405848629965856, "3": 0.006392556578982558, "2": 0.0003441283017236687, "1": 0}, "score": 4.007325047852141}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9799495306307837, "5": 0.019712465043716373, "3": 0.00031862235391575246, "2": 1.9134759648431785e-05, "1": 0}, "score": 4.019355577955434}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9073660473172419, "3": 0.07218960633680811, "2": 0.0163613325403968, "5": 0.004072657680022649, "1": 8.239392026143691e-06}, "score": 3.8991354545829795}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9877039568013439, "5": 0.01205082086245582, "3": 0.0002349537198554571, "2": 9.697698195964452e-06, "1": 0}, "score": 4.011796478481032}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9841459035069249, "5": 0.014483705790636639, "3": 0.0012855019684340902, "2": 8.47880453288456e-05, "1": 0}, "score": 4.013028629043379}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8937196755536482, "2": 0.0608183941744957, "3": 0.03204904157880599, "5": 0.013360024193293699, "1": 4.9713302735618024e-05}, "score": 3.859524611691664}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9688921757679849, "5": 0.024255739722926353, "3": 0.005583988349119368, "2": 0.0012655771699853558, "1": 1.3704765937093706e-06}, "score": 4.016136504137046}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5770994905739811, "4": 0.4222150067610698, "3": 0.00048669836523821747, "2": 0.00019664391556348116, "1": 8.291489696045794e-07}, "score": 4.5762177840120914}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6150217044559915, "4": 0.3848707559057352, "3": 9.013319835548469e-05, "2": 1.6159991998722602e-05, "1": 0}, "score": 4.614900017714485}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6988995866001109, "5": 0.30059296654226275, "3": 0.0004051014615044419, "2": 0.00010083772665282263, "1": 4.6697131740346103e-07}, "score": 4.299985100907441}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9811126286168066, "5": 0.015858205745118818, "3": 0.0027557429483778015, "2": 0.0002728555564645717, "1": 0}, "score": 4.012556758805167}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9684839987060172, "5": 0.025809222233863126, "3": 0.005326034041719243, "2": 0.000379835079790749, "1": 3.9866355353226044e-07}, "score": 4.019722332125437}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9345032072903563, "3": 0.05030679105277724, "2": 0.009452364094814819, "5": 0.0057331486302720416, "1": 1.953544779521812e-06}, "score": 3.9365156077960237}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9843042269347999, "5": 0.015181237326907166, "3": 0.00047298589037086735, "2": 4.0688278684642536e-05, "1": 0}, "score": 4.014626887481244}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9335760236018228, "3": 0.06554731701294203, "4": 0.0007396320686058022, "1": 0.00010327574613167161, "5": 0}, "score": 2.066925564246922}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9356938306697806, "5": 0.06367476173602134, "3": 0.0005094942453836098, "2": 0.00012101549048793744, "1": 2.061643851940083e-07}, "score": 4.06292266153973}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9572307581519203, "5": 0.042057788068405634, "3": 0.0005131405878236192, "2": 0.0001978332606459498, "1": 1.6171003708925336e-07}, "score": 4.041148508923507}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9195933017436192, "5": 0.07788096559946336, "3": 0.0018604280189778947, "2": 0.0006633560389014423, "1": 9.368908971137677e-07}, "score": 4.074691090395576}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8266469909868973, "5": 0.17327462766328333, "3": 6.2850479102852e-05, "2": 1.4928297277051383e-05, "1": 0}, "score": 4.173182024944515}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9094320365357433, "5": 0.09004596651311943, "3": 0.00039789993654744545, "2": 0.0001232636500821873, "1": 0}, "score": 4.089401613780539}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9748798825093732, "5": 0.02440564063094619, "3": 0.00037058007860373427, "2": 0.00034273054589823153, "1": 0}, "score": 4.023349626691702}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9850855946141861, "2": 0.0054173332765855035, "3": 0.004932538079379951, "5": 0.0045618519888582865, "1": 2.370221849059532e-06}, "score": 3.9887875331944977}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9585430725995943, "5": 0.04081968656893323, "3": 0.0005469841129123514, "2": 8.929268395801201e-05, "1": 0}, "score": 4.040094155740259}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.585098365342851, "5": 0.4148968681986313, "3": 3.5392348438023844e-06, "2": 9.675729639022372e-07, "1": 0}, "score": 4.414891501544734}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7122184662596078, "5": 0.2877622674411238, "3": 1.703916568346097e-05, "2": 2.0670853218669315e-06, "1": 0}, "score": 4.287741140157267}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9781191344500332, "3": 0.010207587119042093, "1": 0.00900816401541706, "4": 0.0026628081967440317, "5": 1.4053165191733362e-06}, "score": 2.0065292613288968}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8902132395092724, "4": 0.10969581082358373, "3": 7.669538660238485e-05, "2": 1.3750725109579533e-05, "1": 0}, "score": 4.890109490891921}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5617938001846877, "5": 0.4375254515084952, "3": 0.0005285513476718703, "2": 0.00015143258735443403, "1": 2.5798355354661636e-07}, "score": 4.436693482171897}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9416460689409167, "4": 0.05834533920271668, "3": 6.255809537235593e-06, "2": 2.301383716633209e-06, "1": 0}, "score": 4.9416352430039545}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5466606024351306, "5": 0.4531975571807627, "3": 0.00010613454248143119, "2": 3.555061863635177e-05, "1": 5.344819339249015e-08}, "score": 4.453020207162467}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9210481757553577, "5": 0.07800416939024928, "3": 0.0007647259680578162, "2": 0.00018163833831665965, "1": 0}, "score": 4.076876265958071}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8960371811938873, "5": 0.10372382923797084, "3": 0.00019106459373419168, "2": 4.682239237122834e-05, "1": 0}, "score": 4.103439233909735}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8369161690167468, "5": 0.1597282572242724, "3": 0.00224307766172949, "2": 0.0011104039621493782, "1": 0}, "score": 4.155264696472965}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6076508632678996, "4": 0.3923289001447116, "3": 1.547507334228997e-05, "2": 4.165059486393674e-06, "1": 0}, "score": 4.607627420497731}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6992484944464933, "4": 0.30074302993706914, "3": 5.872389130673944e-06, "2": 2.299660625607593e-06, "1": 0}, "score": 4.699238235001542}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8366483066568802, "5": 0.15967712042374785, "3": 0.002580940529917198, "2": 0.0010928389799398457, "1": 3.8420060957679693e-07}, "score": 4.154909412722435}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8870038696989997, "5": 0.11276987964492181, "3": 0.00012797763959102135, "2": 9.812385997680203e-05, "1": 0}, "score": 4.112445671057381}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7826114410741081, "4": 0.2173233374738056, "3": 5.251067897520435e-05, "2": 1.227901316046609e-05, "1": 0}, "score": 4.782534710235961}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8516260644367928, "5": 0.1479904254819813, "3": 0.000264219066912434, "2": 0.00011909286393271256, "1": 6.90294232036776e-08}, "score": 4.147487832642704}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6992330272408641, "4": 0.3007363835895499, "3": 2.433984107017398e-05, "2": 6.1540755781345565e-06, "1": 0}, "score": 4.699196445849153}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9502768203416566, "5": 0.04046766576153884, "3": 0.0071429673052016635, "2": 0.002111457102336631, "1": 6.15394691618477e-07}, "score": 4.029099951863718}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9868649181090935, "3": 0.011135723556575172, "5": 0.001507056301573721, "2": 0.0004892695467538577, "1": 0}, "score": 3.9893927614851883}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8081870901892894, "5": 0.18033091486382966, "3": 0.010829713203404338, "2": 0.0006503748298318791, "1": 9.185568865710359e-07}, "score": 4.168197862569596}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.826417743970923, "5": 0.17322656794776028, "3": 0.00034502116327093626, "2": 1.0418734272359755e-05, "1": 0}, "score": 4.172860752217178}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8981456051537962, "5": 0.10076915219430022, "3": 0.0010192652035164007, "2": 6.414926015606994e-05, "1": 0}, "score": 4.099621770597821}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8300818737368119, "2": 0.09913913613643949, "3": 0.0681372653751735, "5": 0.002601008563847232, "1": 3.827911924014065e-05}, "score": 3.736069990342564}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9516973256352415, "5": 0.04738221650015978, "3": 0.0006973256776647963, "2": 0.0002228786734072058, "1": 1.8505125429429223e-07}, "score": 4.046238581487515}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9848738402279215, "5": 0.011646592861325553, "3": 0.002899066182149985, "2": 0.0005798497150394914, "1": 0}, "score": 4.007587832188879}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8962251088556217, "5": 0.10374559278026071, "3": 2.586321161370012e-05, "2": 3.237160504215387e-06, "1": 0}, "score": 4.103713275782038}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7979100637111838, "5": 0.20174325597984266, "3": 0.000303308687628132, "2": 4.3018319418871047e-05, "1": 7.21506170097074e-08}, "score": 4.201353750812396}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9134826922293474, "5": 0.08496713026885087, "3": 0.00103667064898692, "2": 0.0005131891845383043, "1": 1.4050946273689724e-07}, "score": 4.082903674409516}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6781317624679961, "5": 0.32032675333139315, "3": 0.0012688257658894006, "2": 0.0002701487026548001, "1": 1.5814585560714572e-06}, "score": 4.318513181451875}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8935245218923942, "2": 0.07334495914995699, "3": 0.028277000724389937, "5": 0.004762623057585683, "1": 8.860422635209536e-05}, "score": 3.8295295008149512}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8266807188721738, "4": 0.17328169741231392, "3": 3.210216771647834e-05, "2": 5.323061234939377e-06, "1": 6.596866370619066e-08}, "score": 4.826637849154792}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.958827054287011, "2": 0.025954257949447702, "3": 0.014788290408231331, "5": 0.0003532641078148778, "1": 6.956179943461725e-05}, "score": 3.9334472685018342}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9678275581324127, "3": 0.01691462748081926, "2": 0.0077440807626580135, "5": 0.00750582044563706, "1": 5.166441005581947e-06}, "score": 3.9750874636882885}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6223666751799934, "4": 0.3774844512058566, "3": 0.00011351211348473008, "2": 3.355411665457825e-05, "1": 0}, "score": 4.622187179364358}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9279258151151795, "5": 0.0574952122421211, "3": 0.008413410147225782, "2": 0.006155382356448648, "1": 6.665583908459545e-06}, "score": 4.036751169794285}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8663471713937702, "5": 0.13285863643094362, "3": 0.0005870830300576064, "2": 0.00020608538185942397, "1": 3.978383778265919e-07}, "score": 4.131858271655421}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9521834577842131, "5": 0.044534210940238246, "3": 0.003078316568772705, "2": 0.0002030368638680144, "1": 0}, "score": 4.041049860784045}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt4", "target_model": "human", "scores": {"4": 0.984215536261189, "5": 0.00878543537204678, "3": 0.0045578238283118045, "2": 0.0024396272932800693, "1": 1.2095223842982417e-06}, "score": 3.9993447281490635}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9837095630500543, "2": 0.011632821925114932, "3": 0.004147810393508044, "5": 0.0004953853071042161, "1": 1.0774815985846131e-05}, "score": 3.9730495083941197}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9508091215398439, "5": 0.04310173618367008, "3": 0.004072221114519678, "2": 0.0020158956319080525, "1": 4.3662462180406575e-07}, "score": 4.03499643454106}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9016957426121088, "5": 0.09805485617786897, "3": 0.00022478796002201075, "2": 2.4444556618989475e-05, "1": 0}, "score": 4.097781195599651}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9842603456619194, "3": 0.00878583072553391, "2": 0.0058526250025368026, "5": 0.0010996756569224644, "1": 0}, "score": 3.9806085653940695}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9434843797070314, "5": 0.053227739465580126, "3": 0.0022315684498463856, "2": 0.001054118295859547, "1": 1.1594671637157908e-06}, "score": 4.048884506599143}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8479385673306458, "5": 0.1520270216382377, "3": 3.2927660787785666e-05, "2": 1.380489377888812e-06, "1": 0}, "score": 4.1519913486357085}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9700726882035234, "5": 0.01776750592125532, "3": 0.00752323535625316, "2": 0.004634930846150508, "1": 6.381075462612347e-07}, "score": 4.0009724955240795}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9281722167677096, "5": 0.07157295498816904, "3": 0.00019791696181675254, "2": 5.670415894049468e-05, "1": 0}, "score": 4.071261644468422}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.995617372563838, "5": 0.002627054558834779, "3": 0.0012216938274426325, "2": 0.0005337185061678742, "1": 1.289594271852086e-07}, "score": 4.000337536851436}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5389284837963388, "5": 0.46096996036807236, "3": 9.090705018476967e-05, "2": 9.732419779827577e-06, "1": 0}, "score": 4.4608600107946}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8523388073416169, "5": 0.14355727420948178, "3": 0.0027555285599162377, "2": 0.001342937365875906, "1": 3.176371660048527e-06}, "score": 4.138106656154499}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9376978663191116, "5": 0.06184787735330881, "3": 0.00038541005983592705, "2": 6.8028964156391e-05, "1": 0}, "score": 4.061326459487495}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5698404326865364, "5": 0.4301381254063488, "3": 1.4972820007784424e-05, "2": 5.863440562267334e-06, "1": 0}, "score": 4.430111686200873}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6992222521429367, "4": 0.30073172221173006, "3": 3.541372858036182e-05, "2": 9.681574644681387e-06, "1": 0}, "score": 4.6991681257306155}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9045874188549613, "2": 0.05024213810024206, "3": 0.027746343867287516, "5": 0.017363213108174232, "1": 5.88275073720496e-05}, "score": 3.888955881927089}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5156098830727779, "4": 0.48437065947429636, "3": 1.739583061995425e-05, "2": 1.777095976214714e-06, "1": 0}, "score": 4.515589079748874}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9284019966023411, "4": 0.07159067148685488, "3": 6.363608291873737e-06, "2": 7.600246271851899e-07, "1": 0}, "score": 4.928394306308798}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9496675870387834, "4": 0.05033053139670268, "3": 1.4524365971738835e-06, "2": 3.449839302449608e-07, "1": 0}, "score": 4.949665524542969}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9937469919368132, "3": 0.004748041793194365, "5": 0.0007873025097383542, "2": 0.0007168470926572768, "1": 0}, "score": 3.994605562125767}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8778962663431117, "5": 0.11881033272928965, "3": 0.0028828479555289112, "2": 0.0004088747841572856, "1": 7.075362301836502e-07}, "score": 4.115107724326262}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8027042252991858, "5": 0.19671112440514674, "3": 0.0004652693838548869, "2": 0.00011763852295419313, "1": 3.252996758280111e-07}, "score": 4.196009879839837}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7732538797273959, "5": 0.20811846877522727, "3": 0.009887113860011433, "2": 0.008725347356961313, "1": 1.31180291887989e-05}, "score": 4.1807416806558955}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5466339479139983, "5": 0.45317545980661295, "3": 0.0001240778955088777, "2": 6.538445623482692e-05, "1": 0}, "score": 4.452921124766735}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9693336144369745, "5": 0.017207731333880854, "3": 0.010601375734627643, "2": 0.0028533215704811994, "1": 2.7697015146921366e-06}, "score": 4.000891404412043}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9181772961026524, "5": 0.08022943592222857, "3": 0.0010258435799964387, "2": 0.0005665246305370377, "1": 0}, "score": 4.0780706133263305}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5312055143201593, "4": 0.46878722102339754, "3": 5.910048619088425e-06, "2": 1.0762998112989664e-06, "1": 0}, "score": 4.531197599508467}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6579191944402492, "5": 0.34132396797515463, "3": 0.0005548581846625375, "2": 0.00020095621690019414, "1": 0}, "score": 4.34036754561499}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8175190612244876, "5": 0.18241315175888767, "3": 4.6918148300218345e-05, "2": 2.0497020988780582e-05, "1": 0}, "score": 4.182325307365789}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.817567001947846, "4": 0.18242384148278662, "3": 5.872835449207765e-06, "2": 3.0947668061922503e-06, "1": 0}, "score": 4.81755509406981}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9198334940932544, "5": 0.06259545545980968, "3": 0.009599320156953481, "2": 0.007958115924850488, "1": 1.2152957526258122e-05}, "score": 4.037043498716226}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9727128096744742, "5": 0.02360217760049225, "3": 0.003194206432301381, "2": 0.0004898474215214356, "1": 3.1183519807117625e-07}, "score": 4.019427353389751}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9678120343028818, "5": 0.024228697530852196, "3": 0.005937500650876965, "2": 0.002020132854858151, "1": 8.977780136846223e-07}, "score": 4.014248248335503}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.705720416884645, "5": 0.29418804713653335, "3": 8.846429797987028e-05, "2": 2.756189356969041e-06, "1": 0}, "score": 4.294094163244044}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.7032559576864947, "4": 0.1952871381802704, "3": 0.10131363262803099, "1": 0.00013442085107250046, "5": 4.253961038584634e-06}, "score": 2.4917685105295315}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8486051478047401, "2": 0.11849183781233917, "3": 0.030910442722096552, "5": 0.0019454032440134933, "1": 4.575145332868883e-05}, "score": 3.733913653502617}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6001731392357855, "4": 0.39980150201777326, "3": 2.2944965814671e-05, "2": 2.3076358478375816e-06, "1": 0}, "score": 4.600145642700602}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8953242193940987, "5": 0.10364128755758976, "3": 0.0009107933728380972, "2": 0.00012326254071432869, "1": 1.5851065847356173e-07}, "score": 4.102483522125727}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8311368804013525, "4": 0.16885569576968684, "3": 6.660373459394234e-06, "2": 6.492422002193586e-07, "1": 0}, "score": 4.831129016469481}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9840090006201695, "5": 0.015415675463781127, "3": 0.0004728438267484242, "2": 0.00010225968998009802, "1": 0}, "score": 4.014738315505388}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7472943340271752, "2": 0.2208997942441307, "3": 0.030366319376756858, "5": 0.0013982329753787917, "1": 3.500407761412931e-05}, "score": 3.529124339156954}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8094657474319591, "2": 0.15939325953510727, "3": 0.030899795908597722, "5": 0.00016992880546737356, "1": 5.781536425781084e-05}, "score": 3.6503054633091514}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6343318555630038, "2": 0.3290870412952475, "3": 0.03361835773678785, "5": 0.0027595628485619678, "1": 0.00019990206227057583}, "score": 3.310365153991404}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9714489336331349, "2": 0.016200447721436292, "3": 0.008019803168387206, "5": 0.00429269130035206, "1": 3.277508286561285e-05}, "score": 3.963773473661407}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7858439131908056, "2": 0.18665428807571735, "3": 0.026890102416174705, "5": 0.00053252948021873, "1": 7.671816851515233e-05}, "score": 3.6001027171911564}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9697887351701209, "5": 0.025048859034839, "2": 0.0030387713695799027, "3": 0.002121404308340582, "1": 9.281690080487421e-07}, "score": 4.016847149414429}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5698274974555299, "4": 0.4301283613817242, "3": 3.705723309648146e-05, "2": 6.748623498660268e-06, "1": 0}, "score": 4.569777134025213}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5466652982698741, "5": 0.45320145016449925, "3": 0.00011656715654646264, "2": 1.6276422006747775e-05, "1": 0}, "score": 4.453052515003509}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6925996654838494, "5": 0.3073392477416912, "3": 5.103861780078765e-05, "2": 9.74089066933867e-06, "1": 0}, "score": 4.307268821755811}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7718042679721185, "5": 0.22814490583440317, "3": 4.096571748247051e-05, "2": 9.730210771269524e-06, "1": 0}, "score": 4.228084509406859}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9865240497026011, "3": 0.0102953041033734, "4": 0.0020591903652778095, "1": 0.0011195623824335756, "5": 0}, "score": 2.01329414762325}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5156133892319037, "5": 0.4843739532059795, "3": 7.964447364479661e-06, "2": 4.398385571228303e-06, "1": 0}, "score": 4.484357334741714}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9545787980065666, "5": 0.04194126046308133, "3": 0.0019012665683076461, "2": 0.0015762053465499639, "1": 1.4599476194159362e-06}, "score": 4.036883240598638}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6224230330339943, "4": 0.37751865284644676, "3": 3.8624066164867145e-05, "2": 1.9120299236861845e-05, "1": 0}, "score": 4.622346522953873}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7248480299221566, "4": 0.27512126909245477, "3": 2.370276144367409e-05, "2": 6.582019136818471e-06, "1": 0}, "score": 4.724811464792456}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7868350389253981, "2": 0.10648654924265268, "3": 0.10648654924265268, "5": 0.0001626171325768373, "1": 1.2737158122642167e-05}, "score": 3.680659486161695}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6925081860359288, "2": 0.2112030681563722, "3": 0.09226778715126467, "5": 0.003929235112130742, "1": 8.680815405363854e-05}, "score": 3.4889923753840657}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9694330877094576, "5": 0.02583451733548139, "3": 0.0029441974845954275, "2": 0.0017857460426559406, "1": 8.44797401394478e-07}, "score": 4.019316324407565}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.959836494744968, "5": 0.03721690073656924, "3": 0.0026130365625110863, "2": 0.00033221008600591213, "1": 2.801703572608733e-07}, "score": 4.0339386400666335}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9493373159074028, "3": 0.03980089020428687, "2": 0.01038268255148921, "5": 0.0004706640443919133, "1": 4.989169973562339e-06}, "score": 3.939889233356814}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9863439160070585, "5": 0.009372269527006058, "3": 0.002602585252725403, "2": 0.0016803553333251194, "1": 6.90655286117505e-07}, "score": 4.003406902266001}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9798452607289052, "5": 0.016859170953629855, "3": 0.003022682792651355, "2": 0.0002725029822184344, "1": 0}, "score": 4.013291487281101}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9904620564977953, "5": 0.007104094294094066, "3": 0.001942151305391411, "2": 0.0004910527510468251, "1": 0}, "score": 4.004179840183239}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9071737242475739, "5": 0.09267362192793052, "3": 0.0001437518512656501, "2": 8.63296968709432e-06, "1": 0}, "score": 4.092512629023515}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9850430294927367, "5": 0.01164859158814642, "3": 0.002366554923831781, "2": 0.0009413505109588503, "1": 1.8276402446544473e-07}, "score": 4.007398789501302}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9854737282894016, "3": 0.008393835597319769, "5": 0.0036101437048210085, "2": 0.0025202864834792376, "1": 0}, "score": 3.9901757154337654}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9754414716768259, "2": 0.013485840443624088, "3": 0.008052763133900362, "5": 0.003009097737922015, "1": 7.117243901257876e-06}, "score": 3.967963183136046}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7541723320453876, "5": 0.24484390351505758, "3": 0.0008426073377461013, "2": 0.00013971806321836676, "1": 0}, "score": 4.243722210776541}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5621397806479472, "5": 0.437794901364209, "3": 4.9967887943065644e-05, "2": 1.4770479462969936e-05, "1": 0}, "score": 4.437715646226274}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9109893429312397, "5": 0.08742499965315856, "3": 0.0012277169163216546, "2": 0.0003572859915902594, "1": 0}, "score": 4.085482766702785}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9544740912283294, "5": 0.021087076801529762, "2": 0.012789962440830976, "3": 0.011645393324038075, "1": 2.8138131545550295e-06}, "score": 3.9838533064609236}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8805973719945432, "5": 0.11917589118102151, "3": 0.00018199542655898446, "2": 4.390844005429327e-05, "1": 0}, "score": 4.118906177918186}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9596125017661634, "5": 0.030368460277738794, "3": 0.0075593051831888735, "2": 0.0024541470792370295, "1": 4.116118295508905e-06}, "score": 4.017888538869745}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6297566147709356, "4": 0.370214800463433, "3": 2.562874461153419e-05, "2": 2.875465453354151e-06, "1": 0}, "score": 4.629725285823295}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.992413414524704, "3": 0.006184305297374198, "2": 0.0013585115868288708, "5": 3.853803046278126e-05, "1": 4.256812147495321e-06}, "score": 3.9911244304804154}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8103364477210695, "5": 0.18655005210621498, "3": 0.0027886973271940793, "2": 0.00032281504979312547, "1": 1.0600642907803101e-06}, "score": 4.183112714365984}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8519141416005888, "4": 0.14804048430834968, "3": 4.2478181089121694e-05, "2": 2.7583027859793503e-06, "1": 0}, "score": 4.851866264036847}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8069990725252689, "5": 0.1916790922162221, "3": 0.0011577142406688607, "2": 0.00016165308007495482, "1": 1.0073544702106576e-06}, "score": 4.190195327548111}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5389103222124593, "5": 0.4609544259421645, "3": 0.00010965121526869072, "2": 2.485178442879271e-05, "1": 1.225090416864651e-07}, "score": 4.460794992243699}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9304155822628395, "5": 0.06136755522630109, "3": 0.00617189720299418, "2": 0.002035275679949617, "1": 8.71688158850821e-06}, "score": 4.051099005725012}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9667826365756585, "5": 0.028296094143182796, "3": 0.003597444668007424, "2": 0.001323425934111756, "1": 2.911558925464429e-07}, "score": 4.022050926510261}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9794860055892641, "5": 0.01970313734158601, "3": 0.0007289889382055704, "2": 8.179029209039193e-05, "1": 8.99643820453059e-08}, "score": 4.018810297697969}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7057241572127664, "5": 0.294189606337315, "3": 7.685953675292358e-05, "2": 9.179562614006693e-06, "1": 0}, "score": 4.294094445715034}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7310022582323422, "5": 0.26892068342912795, "3": 7.025788598755872e-05, "2": 6.637912675470562e-06, "1": 0}, "score": 4.268837193414551}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6368477009414947, "5": 0.36286486019394665, "3": 0.00023099857876358518, "2": 5.573100071819969e-05, "1": 0}, "score": 4.362522656745657}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9189984070310881, "5": 0.07543597467855437, "2": 0.003583749429347688, "3": 0.0019791344031275864, "1": 1.5926743078676771e-06}, "score": 4.06628463907652}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9510687031368886, "2": 0.025345121835173394, "3": 0.023076996041364723, "5": 0.0005019329564901405, "1": 4.342570951953906e-06}, "score": 3.926721452770656}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7908732375489596, "5": 0.20631160653856975, "3": 0.0024781506565105045, "2": 0.0003353814557687837, "1": 6.576341916200986e-07}, "score": 4.203160916355115}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7548918613435897, "5": 0.24507752252935963, "3": 2.2830116374453856e-05, "2": 7.296943471679183e-06, "1": 0}, "score": 4.245040218367176}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8516356538002664, "5": 0.14799208298402866, "3": 0.0002560924617456732, "2": 0.00011542991600594289, "1": 1.630274900086022e-07}, "score": 4.1475047268375755}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9616899890087072, "5": 0.018173096369548516, "3": 0.010851651484776981, "2": 0.009281909391072644, "1": 2.581375917058038e-06}, "score": 3.988749873285615}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9045503586675939, "5": 0.09533891591461177, "3": 0.00010324125779233686, "2": 7.136293742976915e-06, "1": 0}, "score": 4.0952214351936576}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5232111332070928, "4": 0.4763891579744472, "3": 0.00035455559421000216, "2": 4.437785385550081e-05, "1": 0}, "score": 4.522768227244177}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6001596955080369, "4": 0.3997925465644295, "3": 4.354093621401902e-05, "2": 3.987149473697711e-06, "1": 0}, "score": 4.600108318202879}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.8248385654808205, "3": 0.1226013063688112, "4": 0.05191265937293122, "1": 0.0006333780998513697, "5": 0}, "score": 2.2257964286394984}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9846054090705608, "5": 0.012394351925713237, "3": 0.0016513875583678021, "2": 0.001347823243620841, "1": 5.715642137534079e-07}, "score": 4.008045606861389}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8265534859680205, "5": 0.1732550314110836, "3": 0.00018184316011934923, "2": 9.340824811874974e-06, "1": 0}, "score": 4.173054558281655}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9910133098656596, "5": 0.007108048822814289, "3": 0.0014440877090742417, "2": 0.0004335937596038264, "1": 0}, "score": 4.004796778198686}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9121504002039926, "5": 0.0875364150669922, "3": 0.0002965780904513052, "2": 1.5965586433917855e-05, "1": 0}, "score": 4.087207961708523}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8632810281037783, "5": 0.1365908934336505, "3": 0.00011700838021058767, "2": 1.0883474718654918e-05, "1": 0}, "score": 4.136452143567015}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt4", "target_model": "human", "scores": {"5": 0.5850777702428669, "4": 0.4148822640859046, "3": 2.963258374134865e-05, "2": 9.620291425831757e-06, "1": 0}, "score": 4.585029314082864}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9826501357394893, "2": 0.00786268364620793, "5": 0.0054039381725638205, "3": 0.004079106539351278, "1": 2.2560907479101334e-06}, "score": 3.985592668985485}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9454367820914956, "5": 0.05333789632406037, "2": 0.0006406780431511148, "3": 0.0005833439965977746, "1": 0}, "score": 4.051473263132967}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5774849716740689, "4": 0.4224970307585575, "3": 1.2192396966034018e-05, "2": 5.243884591647387e-06, "1": 0}, "score": 4.577462615629495}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.5640060108530504, "4": 0.3018906540057811, "3": 0.1339631522573674, "1": 0.00010286789147684027, "5": 1.4363576003966564e-05}, "score": 2.7377016144023365}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9321574749787284, "2": 0.055980402771661504, "3": 0.01085229826247925, "5": 0.0009482632541576895, "1": 5.8755370285656963e-05}, "score": 3.877958550966971}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7606482870736556, "4": 0.23934862688736386, "3": 2.1734191180008868e-06, "2": 6.424614641194453e-07, "1": 0}, "score": 4.760645034226254}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9091657119903643, "5": 0.09001958690973169, "3": 0.0006981317635660656, "2": 0.00011576155995071803, "1": 0}, "score": 4.089090003991066}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9539654711041746, "4": 0.046033876862926634, "3": 4.115324344034228e-07, "2": 1.1250659441473256e-07, "1": 0}, "score": 4.9539649566602195}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6442005875654498, "5": 0.3557613279761832, "3": 3.0175054042890373e-05, "2": 7.280070585443534e-06, "1": 0}, "score": 4.355716816645564}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9131248324207341, "5": 0.08493382968112709, "3": 0.0011204689230534153, "2": 0.0008197525758548908, "1": 4.001177332583725e-07}, "score": 4.082172714111958}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9827149505319634, "5": 0.016388326440698858, "3": 0.0004796585794325359, "2": 0.00041673459567663414, "1": 2.3780591004305765e-07}, "score": 4.015074486639733}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8773480333563715, "5": 0.12250523686411059, "3": 0.00011346944095299842, "2": 3.3021489878586075e-05, "1": 0}, "score": 4.122325753660745}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8030993171948086, "5": 0.19680794977139393, "3": 4.906321447401424e-05, "2": 4.329813480416126e-05, "1": 6.822014053033698e-08}, "score": 4.196672145309879}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9193315675687375, "5": 0.08033029953477455, "3": 0.0002478075800129466, "2": 8.97499578709906e-05, "1": 1.4363607402606964e-07}, "score": 4.079902595626548}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8803083105248257, "3": 0.08716232449281806, "4": 0.031078683898108375, "1": 0.0014310340273061513, "5": 1.338691259871111e-05}, "score": 2.1479297450610817}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7568079322473836, "5": 0.2381401769283477, "3": 0.002524351704282868, "2": 0.002524351704282868, "1": 0}, "score": 4.230567856731106}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9523663564636876, "5": 0.03061376605827646, "3": 0.011439526314075769, "2": 0.005575179861521745, "1": 2.2209955869928406e-06}, "score": 4.008017240687716}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6001489527456354, "4": 0.3997853903418944, "3": 5.67870642642989e-05, "2": 8.57356436431397e-06, "1": 0}, "score": 4.600075196345227}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.9400929646917384, "3": 0.051404662526637904, "4": 0.00764061944425096, "1": 0.000843963255882723, "5": 0}, "score": 2.065843109513541}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5925535679603094, "5": 0.4072557143684584, "3": 0.00015724766680215015, "2": 3.2960901564672326e-05, "1": 1.8411808847559853e-07}, "score": 4.407032124823505}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6297192650137314, "4": 0.37019286958825254, "3": 6.24445559332798e-05, "2": 2.4838728246887627e-05, "1": 0}, "score": 4.629607509504547}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8120896406697856, "5": 0.18120170063761493, "3": 0.0056455102259501035, "2": 0.0010607599433917656, "1": 9.672885392633204e-07}, "score": 4.173432015146864}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9324492523662552, "4": 0.06754639391086119, "3": 2.7921713588534566e-06, "2": 1.2585302325170815e-06, "1": 0}, "score": 4.932444225684885}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6150833450199691, "4": 0.38490932188760035, "3": 6.529879944937485e-06, "2": 7.441695040782706e-07, "1": 0}, "score": 4.615075363116899}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9886129528300869, "3": 0.006661224183398326, "5": 0.002528315520907866, "2": 0.002196638591547787, "1": 2.282776923925835e-07}, "score": 3.991473123859051}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8128168837853128, "5": 0.18712107719796722, "3": 4.9656810832140674e-05, "2": 1.1794526382518271e-05, "1": 0}, "score": 4.187047941258612}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8658694693617758, "5": 0.13278539837240397, "3": 0.001029794511543355, "2": 0.00031406958133394533, "1": 6.062969223494197e-07}, "score": 4.131125732596403}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9941911151940002, "5": 0.005382641716231978, "3": 0.000272206115789412, "2": 0.0001503264943940616, "1": 1.1658314902395924e-06}, "score": 4.004806297347519}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7825186601618156, "5": 0.21729758618410905, "3": 0.0001146803345162113, "2": 6.84787554647454e-05, "1": 2.0474777114729087e-07}, "score": 4.217045418703197}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt4", "target_model": "human", "scores": {"2": 0.6673308026600357, "4": 0.2166505916278086, "3": 0.11596469356771529, "1": 3.379848766889972e-05, "5": 0}, "score": 2.5492431256233763}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9101953155763662, "5": 0.08734878081232943, "3": 0.001625043003269708, "2": 0.0008299907515056402, "1": 0}, "score": 4.084063829429519}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9763715632165035, "5": 0.014369289836215278, "3": 0.005204211902513222, "2": 0.0040530443049468234, "1": 5.757098706134747e-07}, "score": 4.00105726358453}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6075917295633791, "5": 0.39229069309364906, "3": 0.00010090036632868024, "2": 1.6216164574012253e-05, "1": 0}, "score": 4.3921575411091}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.4999760408540317, "5": 0.4999760408540317, "3": 4.110236070638639e-05, "2": 6.605750502669104e-06, "1": 0}, "score": 4.499921832066255}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt4", "target_model": "human", "scores": {"4": 0.951357773032865, "5": 0.03926722804393923, "3": 0.006823619700839151, "2": 0.0025498003933328212, "1": 8.035390926472212e-07}, "score": 4.0273416181368376}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9245361377055318, "5": 0.04899862708193808, "3": 0.015179066565182574, "2": 0.01128012445193642, "1": 4.355422227525117e-06}, "score": 4.011246264338591}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.545896380801134, "5": 0.45256399519343615, "3": 0.00137445086299673, "2": 0.00016415474630445385, "1": 0}, "score": 4.450861693993634}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.966780296964509, "5": 0.03107710203335677, "3": 0.0015232501048539388, "2": 0.0006154486770350067, "1": 0}, "score": 4.028323065097271}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.980866666064807, "5": 0.015366451806020925, "3": 0.0033755614936717966, "2": 0.00039074960482014516, "1": 0}, "score": 4.011209397503619}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8611822107989814, "2": 0.09076795265523525, "3": 0.047089793497931846, "5": 0.0009325625788608773, "1": 2.6044628777195173e-05}, "score": 3.772228402840508}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.972260953377971, "3": 0.012238959667444765, "2": 0.009531711372985323, "5": 0.005964792561380439, "1": 2.692591352463162e-06}, "score": 3.974654309805373}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt4", "target_model": "gpt35", "scores": {"2": 0.8229857608282516, "3": 0.11137900881381041, "4": 0.06547634150406567, "1": 0.00010478845021738949, "5": 5.187404444087172e-05}, "score": 2.2423830651368175}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9765328516388553, "2": 0.01084829884247809, "3": 0.010514531775661019, "5": 0.0021030386582514024, "1": 8.918244755666182e-07}, "score": 3.969889222063499}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8505396488070106, "2": 0.10813397623213647, "3": 0.038556356608422514, "5": 0.002749711450224476, "1": 1.7404896209088134e-05}, "score": 3.747872456013258}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9556585117750058, "5": 0.02318836580528721, "2": 0.015446775545135861, "3": 0.005682551155445282, "1": 2.286324405496094e-05}, "score": 3.986543661279705}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9510742060363248, "5": 0.047351191310211094, "3": 0.000908888348739746, "2": 0.000664956920905504, "1": 3.145766721179097e-07}, "score": 4.045111465365324}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.956754328993868, "5": 0.02395187907395938, "2": 0.011138658206355458, "3": 0.00814921642926442, "1": 4.507201982376533e-06}, "score": 3.993511815477083}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9741545221027041, "5": 0.025161624058705034, "3": 0.00047548011309381114, "2": 0.00020772198144807026, "1": 1.4984191478921139e-07}, "score": 4.024270262638268}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9612410326965721, "5": 0.03845448287883083, "3": 0.0002472390192436878, "2": 5.691765407589438e-05, "1": 0}, "score": 4.038093421036602}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9933354701454229, "3": 0.0033132963798723153, "5": 0.0030167906841967007, "2": 0.00033322687288777616, "1": 0}, "score": 3.9990370393876686}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9706187337420867, "5": 0.028408365992318677, "3": 0.0006786219229438733, "2": 0.00029187176882769744, "1": 9.145616111314366e-07}, "score": 4.027143297345017}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9788764447334808, "5": 0.014863451482601021, "3": 0.003938422565207328, "2": 0.002315279186026105, "1": 4.61141871966536e-06}, "score": 4.006280647535398}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9462090890375051, "5": 0.053381464500696606, "3": 0.00032749361475838405, "2": 8.151960618189136e-05, "1": 0}, "score": 4.052890954588097}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9818566538097795, "5": 0.016374009300891165, "3": 0.0014994078732131026, "2": 0.0002688290183421742, "1": 3.403436481250743e-07}, "score": 4.0143359332504}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7013400758389864, "2": 0.2138966552491301, "3": 0.08376313372290682, "5": 0.0009018948671146627, "1": 9.655603930349e-05}, "score": 3.489054921952154}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9233036195310368, "5": 0.07345757134901416, "3": 0.002253158430969835, "2": 0.000984332019139419, "1": 8.564910232266283e-07}, "score": 4.0692332114048195}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9726221346947803, "5": 0.022170125379550872, "3": 0.003144392409568029, "2": 0.0020621428879152902, "1": 4.06671541770023e-07}, "score": 4.014900239069271}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7548220899133821, "5": 0.24505487841245222, "3": 6.503090106733397e-05, "2": 5.738956876420749e-05, "1": 0}, "score": 4.244875218042651}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9067098235403415, "5": 0.09262624075407534, "3": 0.00037267344662220175, "2": 0.0002902383720592904, "1": 2.646631371927687e-07}, "score": 4.091672366173762}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9067604919009417, "3": 0.051155922826682576, "4": 0.03861451642587345, "1": 0.0034272331676110978, "5": 3.3599411702586134e-05}, "score": 2.125059550769801}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.94334410344371, "4": 0.05665222590766445, "3": 2.3055322433338093e-06, "2": 1.234062482063447e-06, "1": 0}, "score": 4.943339453414817}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8558263975576184, "4": 0.1441446888763522, "3": 2.3566437452014985e-05, "2": 4.863209242578245e-06, "1": 0}, "score": 4.8557935188367125}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9850419873177628, "4": 0.014957072710714838, "3": 5.899689078468055e-07, "2": 2.9665499688640184e-07, "1": 0}, "score": 4.9850408565884425}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9093869843886043, "5": 0.08727122334258394, "3": 0.0022191977994505977, "2": 0.001115882731327384, "1": 2.518467440439809e-06}, "score": 4.082813051935694}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9584448317620515, "5": 0.025541688974611537, "2": 0.009847198307937923, "3": 0.006162219240512939, "1": 3.103227062568655e-06}, "score": 3.999675763126258}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6140495830145947, "5": 0.38426241015490026, "3": 0.0010625809200698415, "2": 0.0006246590981475, "1": 2.909310614716342e-07}, "score": 4.3819498200081}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5388010422804742, "4": 0.4608609538629726, "3": 0.0002756071708813954, "2": 6.149627217682141e-05, "1": 0}, "score": 4.538402927350502}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6297464757710569, "4": 0.370208840053127, "3": 3.969390136824138e-05, "2": 4.891248353712099e-06, "1": 0}, "score": 4.629697061729422}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.998266467805694, "3": 0.0008961883096959284, "2": 0.000615940617031815, "5": 0.0002196203904396206, "1": 7.558030579964332e-07}, "score": 3.998089281475056}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9259065197738554, "5": 0.07366466783221189, "3": 0.000357506505068483, "2": 7.039720480943175e-05, "1": 1.9164770886091401e-07}, "score": 4.073165844436968}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9925213334419098, "5": 0.006481800190650998, "2": 0.000612395648411749, "3": 0.0003832274043275078, "1": 6.427525650920838e-07}, "score": 4.004871856157657}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9097588942051342, "5": 0.0900783348497259, "3": 0.00012524972670471048, "2": 3.702374849508241e-05, "1": 0}, "score": 4.089879082338172}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9342542607657218, "5": 0.065594934762469, "3": 0.00012662805111620477, "2": 2.3423834163009245e-05, "1": 0}, "score": 4.065421508278373}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.909613390816636, "5": 0.09006392346909116, "3": 0.00021978516751613007, "2": 0.00010220959500627875, "1": 1.9731093544202985e-07}, "score": 4.089639171428309}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8736716416243807, "5": 0.12586431718321953, "3": 0.0003882733329480499, "2": 7.527021895456374e-05, "1": 0}, "score": 4.1253255657794385}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5774712392447217, "4": 0.4224869838986237, "3": 2.834749192381021e-05, "2": 1.2978427525271714e-05, "1": 0}, "score": 4.577417195276644}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9422377195802037, "5": 0.053157418886151164, "3": 0.0032936859229390106, "2": 0.0013101377429586335, "1": 0}, "score": 4.047243506509807}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6513473469517018, "4": 0.34864111836424455, "3": 6.102347651032127e-06, "2": 5.059023891965401e-06, "1": 0}, "score": 4.651331369706416}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5926018037839127, "5": 0.4072888663328746, "3": 9.24486687417089e-05, "2": 1.657513296339897e-05, "1": 0}, "score": 4.40716339202339}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9362757417524724, "5": 0.03305457485582254, "3": 0.021341637547362274, "2": 0.009323469086123476, "1": 3.892454976640306e-06}, "score": 3.9930543170183297}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8149789453511054, "2": 0.16557301553112422, "3": 0.01916646771476563, "5": 0.00022313847836873086, "1": 5.217834478563532e-05}, "score": 3.649751914012376}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8684577079466489, "5": 0.12511318141920483, "3": 0.004557247300063702, "2": 0.001870290523541808, "1": 6.473291106385172e-07}, "score": 4.116813519193468}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5389425823498832, "5": 0.46098201949996837, "3": 6.970273509544891e-05, "2": 5.3748977897060175e-06, "1": 0}, "score": 4.46090171469625}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8618044587927186, "5": 0.13216197834553053, "3": 0.005540879701191961, "2": 0.0004917810307458387, "1": 0}, "score": 4.1256376499243155}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt4", "target_model": "human", "scores": {"5": 0.7824526027248483, "4": 0.21727922531383417, "3": 0.0002142328607897814, "2": 5.332677541114057e-05, "1": 1.1848884687488476e-07}, "score": 4.782131747091721}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7662837707085887, "4": 0.23370335068312284, "3": 1.077719748332478e-05, "2": 1.9935810775428945e-06, "1": 0}, "score": 4.7662690889755375}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9263011696602709, "4": 0.0736960556658423, "3": 1.6562890005288493e-06, "2": 6.692012499555077e-07, "1": 0}, "score": 4.926298591046941}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6001555844282032, "4": 0.3997898079948652, "3": 4.354058788792265e-05, "2": 1.0838109256481668e-05, "1": 0}, "score": 4.600090504970389}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9783835675276116, "4": 0.021615310412272735, "3": 9.967877283842386e-07, "2": 8.182115567026458e-08, "1": 0}, "score": 4.978382449609494}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9713750286096468, "5": 0.025886266548527815, "3": 0.0015067613995126108, "2": 0.0012297828129824435, "1": 1.5569340859752673e-06}, "score": 4.021915281950944}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9835911138437423, "5": 0.0060343025417563395, "2": 0.005668702632694465, "3": 0.004699519544809606, "1": 5.502571662527379e-06}, "score": 3.989980861411479}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9186486752308499, "2": 0.04296577115206167, "3": 0.025656033778488196, "5": 0.012700655152971472, "1": 2.7351860659072113e-05}, "score": 3.9010308737654174}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9829006746721816, "5": 0.015398317943130898, "3": 0.0012639709071722558, "2": 0.0004368166570450611, "1": 1.1591925103564708e-07}, "score": 4.013260367341884}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8520944001435048, "2": 0.09560233830180519, "3": 0.051172244169180016, "5": 0.0011130146991416186, "1": 1.6638221654619154e-05}, "score": 3.758685849996745}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7716047823534748, "5": 0.2280859379981662, "3": 0.00026292072423225233, "2": 4.568877106468549e-05, "1": 0}, "score": 4.227731792346963}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6723051427833241, "5": 0.3276553451607702, "3": 2.8228795047895725e-05, "2": 1.0714442074176026e-05, "1": 0}, "score": 4.327605873829949}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.990107950390037, "2": 0.004375143323727516, "5": 0.003801190392962324, "3": 0.001713330743089127, "1": 1.3363533958188668e-06}, "score": 3.9933335569504864}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8354783950403015, "4": 0.16451544871914267, "3": 3.212375061053775e-06, "2": 2.07406522450308e-06, "1": 0}, "score": 4.835471761228355}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6150399585710694, "5": 0.3848821867369326, "3": 6.594476897439107e-05, "2": 1.1459482554608502e-05, "1": 0}, "score": 4.3847934963294115}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9071934464187182, "5": 0.06995525189419981, "3": 0.011419878660338424, "2": 0.011419878660338424, "1": 9.334671236149843e-06}, "score": 4.0356676907142}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9627219422992784, "2": 0.026470070482904413, "3": 0.010205121263881432, "5": 0.0005757335448760995, "1": 2.032587201263602e-05}, "score": 3.9373690673993855}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.692508476889428, "5": 0.30729880455790826, "3": 0.00016217906397237558, "2": 3.0000110289266293e-05, "1": 0}, "score": 4.307076790903945}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8354754875805457, "4": 0.16451487291607983, "3": 7.1269370649091095e-06, "2": 2.1735929984854507e-06, "1": 0}, "score": 4.835464296657582}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8595093893661462, "5": 0.140311054935397, "3": 0.00013408736404080487, "2": 4.491364104011957e-05, "1": 0}, "score": 4.140087217994728}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.781342058494929, "3": 0.11256300158479117, "2": 0.1057431540782468, "5": 0.000297010816687954, "1": 5.242552326577846e-05}, "score": 3.6760896634775966}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9147377379341965, "5": 0.0850838702623764, "3": 0.00012206058965472212, "2": 5.588341010144695e-05, "1": 0}, "score": 4.084850080848697}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.976416111185318, "2": 0.01119132113198909, "3": 0.01119132113198909, "5": 0.0011981318822466961, "1": 1.4473995867881793e-06}, "score": 3.967619772300974}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5078072005085801, "4": 0.4921836154393085, "3": 5.829070524919761e-06, "2": 3.1200766161064914e-06, "1": 0}, "score": 4.507795250568452}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9800617383357926, "5": 0.01971472027871435, "3": 0.00013077725833473557, "2": 9.273496240737378e-05, "1": 0}, "score": 4.019398473661315}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt4", "target_model": "human", "scores": {"4": 0.973640402618161, "2": 0.015253239076851725, "5": 0.006067319314746026, "3": 0.005029984381222809, "1": 8.30553830518123e-06}, "score": 3.9705059180717512}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.986952460857428, "5": 0.0109640504404541, "3": 0.00187572786541482, "2": 0.00020397604448713771, "1": 2.7763234653715018e-06}, "score": 4.00867205026116}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8712567320940844, "2": 0.09182978303872262, "3": 0.023218205226348192, "5": 0.01364927325719047, "1": 4.552754639147337e-05}, "score": 3.8066348267237724}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6150632751778623, "5": 0.3848967740482377, "3": 3.214010277279303e-05, "2": 7.75416065458454e-06, "1": 0}, "score": 4.3848491473721625}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.995881186675162, "1": 0.00258701002665775, "3": 0.0013008303339309625, "4": 0.0002296101929781805, "5": 0}, "score": 1.9991730395662717}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9880307462818559, "2": 0.005266356087942456, "5": 0.004434716449448087, "3": 0.002265031529126215, "1": 1.7944876652931678e-06}, "score": 3.9916315779408578}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9193440705630765, "5": 0.0803313920342772, "3": 0.00020867761684837608, "2": 0.00011524272519869567, "1": 0}, "score": 4.079892278265409}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8291648911055772, "2": 0.1440872586615653, "3": 0.026240239176230005, "5": 0.00048060664898450477, "1": 2.4687562096619263e-05}, "score": 3.68599105995312}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6991596955265494, "5": 0.30070483799750664, "3": 8.494547312206615e-05, "2": 4.993686751749209e-05, "1": 0}, "score": 4.300520194333805}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9818088454277117, "5": 0.017982455335531295, "3": 0.00014165613806655514, "2": 6.691362161310387e-05, "1": 0}, "score": 4.017706974246885}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6909370632795292, "5": 0.3066014755296707, "2": 0.0016861092890545577, "3": 0.0007719570841221947, "1": 2.7841136326489772e-06}, "score": 4.302449132233433}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8477411223884672, "5": 0.15199160346857296, "3": 0.00017520479694740814, "2": 9.089505124609277e-05, "1": 3.9542488180624323e-07}, "score": 4.151633540397286}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5152825438114707, "5": 0.48406315269625266, "3": 0.0005847711405565065, "2": 6.875816945780319e-05, "1": 0}, "score": 4.483341239410994}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5620087836163464, "4": 0.43769288077341834, "3": 0.00020385267630286167, "2": 9.333055609787985e-05, "1": 5.549637725584056e-07}, "score": 4.561616940454388}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8440971958980954, "5": 0.13779508343918634, "2": 0.01475220818416981, "3": 0.003343498717668497, "1": 8.418212873842136e-06}, "score": 4.10492229096769}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt4", "target_model": "human", "scores": {"2": 0.7302799684057711, "4": 0.21587036791518582, "3": 0.0529013087684255, "1": 0.0005435155722606183, "5": 0.0004039064767479313}, "score": 2.485310701184502}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.7312873535228858, "4": 0.14857003734053, "3": 0.11937939071488098, "1": 0.00041083302139408566, "5": 0.00034595608947222354}, "score": 2.417149182624724}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9106997581257293, "5": 0.06806501007482556, "3": 0.011111307449848734, "2": 0.010116960561566435, "1": 6.440418728553468e-06}, "score": 4.036700479453562}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9530414195455897, "5": 0.02539769137084728, "2": 0.013176148706582323, "3": 0.008375269689986838, "1": 8.79042936917504e-06}, "score": 3.9906437466149254}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.6616915289470838, "4": 0.3029444571536428, "3": 0.03452468167015367, "5": 0.0004773164833401075, "1": 0.0003602973843072394}, "score": 2.641486350348582}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.583791546965365, "5": 0.4139701952078331, "3": 0.0017729928227156139, "2": 0.00046251281189540507, "1": 1.8036268565244567e-06}, "score": 4.4112671559945245}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6000451359572214, "5": 0.3997162334516087, "3": 0.000186165219807878, "2": 5.1696214481055564e-05, "1": 3.171547537546384e-07}, "score": 4.399425904879936}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9511257508996452, "4": 0.04885693233093888, "3": 1.5639137053136466e-05, "2": 1.548484263500048e-06, "1": 0}, "score": 4.951107137627744}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9678957730225745, "4": 0.03210058579330697, "3": 2.598032838189352e-06, "2": 6.672300152688571e-07, "1": 0}, "score": 4.967892204380967}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.8558379085000765, "4": 0.1441466348427873, "3": 1.2418801297569494e-05, "2": 2.858970394133592e-06, "1": 0}, "score": 4.855819924851717}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9643303561266642, "5": 0.027355945171690387, "3": 0.005645220618704002, "2": 0.0026666134031197077, "1": 8.403503069159061e-07}, "score": 4.016374993469215}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9762683886505028, "5": 0.021568576827745697, "2": 0.0011979506186058529, "3": 0.0009625803642145772, "1": 2.105638102893683e-06}, "score": 4.018203785555313}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9700587764908561, "5": 0.028391979093216144, "3": 0.0013279100017379631, "2": 0.00022018928393614578, "1": 4.3855833540128633e-07}, "score": 4.026622393659235}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.909142946765958, "5": 0.09001733644818984, "3": 0.0005269641701839335, "2": 0.00030978625447321755, "1": 2.2219441546132613e-06}, "score": 4.0888642000886195}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9871700002682124, "5": 0.011857579448036318, "3": 0.0006689588563175402, "2": 0.0003015233797582485, "1": 1.139651550200012e-06}, "score": 4.01058216332631}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt4", "target_model": "human", "scores": {"5": 0.6213141172846146, "4": 0.37684605014002814, "3": 0.0016914514034692474, "2": 0.00014779727303389272, "1": 1.6256807497130185e-07}, "score": 4.619326844572314}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7901656989565221, "3": 0.10045828623334545, "2": 0.05723940609766316, "5": 0.052117072331161814, "1": 1.518977581786097e-05}, "score": 3.8371336966594685}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5739232284228108, "4": 0.41989120372964195, "3": 0.0055393135158911585, "2": 0.0006412220815313668, "1": 1.745647519138867e-06}, "score": 4.567098097627385}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.91725744419891, "4": 0.08269326658810222, "3": 4.502728133506764e-05, "2": 3.996398409782995e-06, "1": 0}, "score": 4.917204667669085}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6439008334891672, "4": 0.3555957951766134, "3": 0.00045019249499969344, "2": 5.2113579508973686e-05, "1": 0}, "score": 4.643347099166894}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.92407783858099, "2": 0.03814124639017338, "3": 0.03313768912841345, "5": 0.004627058157393499, "1": 1.3834660281946643e-05}, "score": 3.895165127679356}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9820088337461056, "5": 0.011255425499079697, "3": 0.005234258957897375, "2": 0.0014996402994460177, "1": 9.696991191597425e-07}, "score": 4.003018979476875}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9686653875625691, "5": 0.023139573237927622, "3": 0.007281189771323035, "2": 0.0009113477592604323, "1": 9.565225239904245e-07}, "score": 4.0140328400633045}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8353910169244824, "5": 0.16449825775299515, "3": 0.00010471899850068358, "2": 5.7260764499874495e-06, "1": 0}, "score": 4.164382132669289}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9486604045390942, "3": 0.030021865884344523, "2": 0.019383573468842844, "5": 0.001919233675420765, "1": 1.2148194500521869e-05}, "score": 3.933093590655599}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6375666234739227, "2": 0.3307652069072977, "3": 0.03125044696568787, "5": 0.000326127874643889, "1": 8.50755391710977e-05}, "score": 3.307285524505431}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9822941232126594, "5": 0.016901300624243016, "3": 0.0005348684655936134, "2": 0.0002689489428255267, "1": 2.033191347466839e-07}, "score": 4.0158279331069915}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.976202147182659, "5": 0.02090356626246689, "3": 0.0020697333426059365, "2": 0.0008232830432078151, "1": 6.522512477095073e-07}, "score": 4.017185320698818}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6583737498646369, "5": 0.3415598018756969, "3": 5.497637557546103e-05, "2": 1.0995966876373265e-05, "1": 0}, "score": 4.341482996084006}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5311340401150447, "5": 0.46872414525876926, "3": 0.00010312012367532847, "2": 3.793577347120986e-05, "1": 0}, "score": 4.468545509087236}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9875838375754281, "5": 0.009989267623200477, "3": 0.0016054214037637966, "2": 0.0008199690191041679, "1": 6.198774746309324e-07}, "score": 4.0067420545121575}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9730357406940423, "5": 0.026753646424381713, "3": 0.00018310349839398605, "2": 2.7215905351374452e-05, "1": 0}, "score": 4.026516118897177}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.972551321627721, "5": 0.02512021194793347, "3": 0.002030024331580554, "2": 0.00029705834222056504, "1": 5.060744723152502e-07}, "score": 4.022494572451443}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7310126970191225, "5": 0.2689245290223969, "3": 5.386934393590861e-05, "2": 8.391225343971388e-06, "1": 0}, "score": 4.268854015254521}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9868309044221393, "5": 0.005426930990168787, "3": 0.004499083813205517, "2": 0.003240568505206821, "1": 1.7102311861653796e-06}, "score": 3.994441575014923}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9797820872422969, "5": 0.015836699170688955, "3": 0.0033195524810627525, "2": 0.001060992699655774, "1": 3.0443750772651737e-07}, "score": 4.0103942517609745}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8977012587733225, "2": 0.057388118032660446, "3": 0.039442238253838385, "5": 0.005421986596321075, "1": 4.5466125672158675e-05}, "score": 3.851066975062071}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6966048212202784, "5": 0.2996060002508705, "3": 0.003225920316458565, "2": 0.0005605808946479127, "1": 1.456226583152959e-06}, "score": 4.295254909998527}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.615070772844885, "5": 0.3849014544214668, "3": 2.27910418619793e-05, "2": 4.77726189930822e-06, "1": 0}, "score": 4.38486918753457}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6222926490667711, "5": 0.37743957097279096, "3": 0.000218774289757387, "2": 4.8815142309924755e-05, "1": 1.0512728319822211e-07}, "score": 4.377122883223269}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7480146841378613, "5": 0.25055352716159474, "3": 0.001215976282684103, "2": 0.00021463256324925526, "1": 3.4349853163819474e-07}, "score": 4.2489074634320865}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9884908716118423, "4": 0.011508139630781043, "3": 4.610768984237583e-07, "2": 6.961219983367887e-08, "1": 0}, "score": 4.9884907241067875}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.9958006822965574, "4": 0.004198793738765157, "3": 3.2426362324457137e-07, "2": 6.691564772013155e-08, "1": 0}, "score": 4.995800356429394}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9591505720370294, "4": 0.04084555403302879, "3": 3.0099653226022584e-06, "2": 5.744619346944153e-07, "1": 0}, "score": 4.9591466908233794}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9875678092198148, "4": 0.012431641781517299, "3": 3.1659736890647417e-07, "2": 1.495500077572265e-07, "1": 0}, "score": 4.987567275343655}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8262459000058416, "2": 0.11182020612734839, "3": 0.06175298281156213, "5": 0.00015307034055979979, "1": 2.311016485988625e-05}, "score": 3.714688995101796}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9639129338822501, "5": 0.035110522749722615, "3": 0.000838723889849154, "2": 0.00013691777428795986, "1": 0}, "score": 4.0339979939674215}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9731348455387194, "3": 0.019575380485033416, "2": 0.004949431289559973, "5": 0.0023379457962779595, "1": 1.0070533162488254e-06}, "score": 3.972860643852892}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9262591350669638, "5": 0.07369271731013496, "3": 3.950430123342724e-05, "2": 8.280551379973508e-06, "1": 0}, "score": 4.073636678619341}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9787818771118302, "2": 0.010538753569763871, "3": 0.008874520262599885, "5": 0.0018029681498553261, "1": 8.012674904460114e-07}, "score": 3.9718485065518214}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6369707326945249, "2": 0.3008836601733211, "3": 0.06112821716597243, "5": 0.0009281829501967051, "1": 8.238089538948923e-05}, "score": 3.3377809823645386}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6297582647354277, "5": 0.3702157630231656, "3": 2.124700741585813e-05, "2": 4.316591378124758e-06, "1": 0}, "score": 4.370186034106782}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.57744081308671, "4": 0.4224647236458936, "3": 7.3523939301019e-05, "2": 2.010032648492632e-05, "1": 0}, "score": 4.577327572873203}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8596606161552919, "4": 0.14033573782075623, "3": 2.6977512563493935e-06, "2": 6.508627802381667e-07, "1": 0}, "score": 4.859656872348952}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5698257309930257, "5": 0.4301270279858707, "3": 3.883553033797978e-05, "2": 7.647169336294898e-06, "1": 0}, "score": 4.430073224250602}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8266021052739448, "5": 0.17326521910644585, "3": 0.00011380125593468903, "2": 1.8577544342962383e-05, "1": 0}, "score": 4.1731143141455}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9791654125486806, "2": 0.011399569356965365, "5": 0.005301292077118468, "3": 0.004128650420950097, "1": 3.7064759925199306e-06}, "score": 3.978362353889719}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9701892474989087, "5": 0.028395798071224686, "3": 0.0010839548804847507, "2": 0.00033058756060810434, "1": 0}, "score": 4.026650679049305}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5621586913482444, "4": 0.43780962903240894, "3": 2.1491630020504335e-05, "2": 9.839585222239247e-06, "1": 0}, "score": 4.5621177163918984}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9322971263570164, "5": 0.06753538474592502, "3": 0.0001303739106749259, "2": 3.677365006883544e-05, "1": 0}, "score": 4.067331486517794}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.98740808107006, "5": 0.005871342300433702, "3": 0.0053459179997537715, "2": 0.0013729452900555666, "1": 1.1946336364054893e-06}, "score": 3.9977759486660296}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9139481571309219, "2": 0.07047612352013424, "3": 0.014772593580308713, "5": 0.000795247954090807, "1": 4.728720024544843e-06}, "score": 3.8450557332392985}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.971586315940227, "3": 0.016457889695539258, "2": 0.008809273548842313, "5": 0.0031410432155121832, "1": 2.449932707772864e-06}, "score": 3.969057162939553}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9494972053690545, "5": 0.05032150794140019, "3": 0.00016784862943283749, "2": 1.2742432397804557e-05, "1": 0}, "score": 4.050128209317743}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9655299957640883, "5": 0.03303862326276634, "3": 0.0009519928820872185, "2": 0.00047869208311702, "1": 1.4171426852673198e-07}, "score": 4.031128838326157}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9984735680840818, "1": 0.0010317199655050244, "3": 0.0004797943420200152, "4": 1.4042768390405268e-05, "5": 0}, "score": 1.9994761594550188}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.607645199988245, "4": 0.3923252358098967, "3": 2.5915637680695766e-05, "2": 3.507300165774394e-06, "1": 0}, "score": 4.607612355583992}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7710469286660526, "5": 0.2279210230878792, "3": 0.0009761629778399062, "2": 5.507134673623882e-05, "1": 2.9353880258331836e-07}, "score": 4.2268339548406235}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5774782266889905, "5": 0.4224920960220572, "3": 2.834783209575432e-05, "2": 1.2071962932893654e-06, "1": 0}, "score": 4.422461385447742}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8127545918863955, "5": 0.18710674427241192, "3": 0.00011911144386868345, "2": 1.944440869347413e-05, "1": 0}, "score": 4.186948764199497}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9542846307013508, "2": 0.027930298825368256, "3": 0.014265396491437434, "5": 0.003495885756742891, "1": 2.212797307116694e-05}, "score": 3.933303396962185}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9869393418790343, "5": 0.005343379291694786, "3": 0.004096911015836453, "2": 0.003615511281640378, "1": 3.5095560849812807e-06}, "score": 3.994004908969081}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6218898760928837, "5": 0.3771952579554612, "3": 0.0005943053579902756, "2": 0.0003181088303269996, "1": 1.2600401152596892e-06}, "score": 4.3759614028584055}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9555573845639852, "2": 0.0312000525460453, "3": 0.010450713765345274, "5": 0.002769163472167906, "1": 1.752799922300322e-05}, "score": 3.92986539888711}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.979243139825675, "5": 0.01582799612940488, "2": 0.002882492234039667, "3": 0.002043993063985316, "1": 1.8065348411429993e-06}, "score": 4.008013603578297}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9855679628070603, "5": 0.01362583984953054, "3": 0.000678390620158142, "2": 0.0001274658592259055, "1": 0}, "score": 4.012692521837345}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9841949811343619, "5": 0.014944215157723857, "2": 0.0005034349750623604, "3": 0.00035698885327193724, "1": 1.8548236997158706e-07}, "score": 4.013579802547095}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9121207557977102, "5": 0.08753357893308966, "3": 0.0002576630073222366, "2": 8.766542307600874e-05, "1": 0}, "score": 4.087100614418482}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6076513980008946, "5": 0.3923292375477108, "3": 1.753557295447577e-05, "2": 1.79137155441563e-06, "1": 0}, "score": 4.392308133945904}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8804933795857833, "5": 0.11916182925553206, "3": 0.00030474871688418274, "2": 3.935458781244439e-05, "1": 0}, "score": 4.118778453065255}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6114230743812367, "5": 0.38261879452962017, "3": 0.004595897597644723, "2": 0.0013585447349159945, "1": 2.9257315675157245e-06}, "score": 4.375297316628682}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8157293728055236, "5": 0.17098617050324585, "2": 0.008646960561156176, "3": 0.004628384462311824, "1": 7.885010546583072e-06}, "score": 4.1490403927084545}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5144188613663933, "5": 0.4832517981252243, "3": 0.0014224952943262723, "2": 0.0009041930224093511, "1": 1.6397479778165616e-06}, "score": 4.480016483531795}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.793092205366533, "4": 0.206890460936224, "3": 1.2443464657306627e-05, "2": 4.649783028459459e-06, "1": 0}, "score": 4.793070653029306}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.603705731059822, "5": 0.38978171565484737, "2": 0.00530533160955423, "3": 0.0012024213061462396, "1": 3.0274405450830707e-06}, "score": 4.377960218904623}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9908571434289394, "3": 0.006174607260680427, "1": 0.002573959253408825, "4": 0.0003886097232903777, "5": 0}, "score": 2.0043778923217417}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.531181217535606, "5": 0.4687657791862865, "3": 4.0386014850243596e-05, "2": 1.1938083186874117e-05, "1": 0}, "score": 4.468701835338008}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5077723610517344, "4": 0.49214984787986255, "3": 6.775603667227681e-05, "2": 9.609849460356835e-06, "1": 0}, "score": 4.507685601175059}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.4999723110466791, "5": 0.4999723110466791, "3": 3.983745531114694e-05, "2": 1.488616946358388e-05, "1": 0}, "score": 4.499903028329928}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6369874215463445, "5": 0.3629445177728587, "3": 4.409650633844958e-05, "2": 2.360315897541523e-05, "1": 0}, "score": 4.362853345944245}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt4", "target_model": "human", "scores": {"2": 0.7729687330874861, "4": 0.17794752064453764, "3": 0.04715139895666426, "1": 0.001180411703600656, "5": 0.0007386827688634046}, "score": 2.404087432154348}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8668975198958762, "2": 0.07005606702696572, "3": 0.04967719024607016, "1": 0.010412901633376796, "5": 0.0028467288950524898}, "score": 3.7817947860830747}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5467199073939256, "4": 0.4532467227184563, "3": 2.5211911413089347e-05, "2": 7.569988573206546e-06, "1": 0}, "score": 4.5466798769463725}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7185802418635667, "4": 0.28140003779254263, "3": 1.4252146942022704e-05, "2": 5.2430718525245935e-06, "1": 0}, "score": 4.718555665337832}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9746148360323049, "5": 0.020227484106901047, "2": 0.004306679885120827, "3": 0.000848035550747348, "1": 0}, "score": 4.010766120701269}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9616661720893656, "5": 0.013717429890463883, "3": 0.012686548754572017, "2": 0.011917909622064985, "1": 1.08677268514697e-05}, "score": 3.97716243423124}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6076144174621415, "5": 0.3923053454246667, "3": 7.38230163735786e-05, "2": 6.155189566627114e-06, "1": 6.323929327197814e-08}, "score": 4.39221909905599}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7876148638984973, "5": 0.21198367754213396, "3": 0.0003555406390729639, "2": 4.520191973566555e-05, "1": 2.77312446702562e-07}, "score": 4.211536993925014}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5850805552196815, "5": 0.4148842389301818, "3": 2.963273190463776e-05, "2": 5.230487876565504e-06, "1": 0}, "score": 4.41484428736077}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9719593824477692, "3": 0.016464209092323975, "2": 0.008278724237936779, "5": 0.0032419949932816373, "1": 4.92271134439073e-05}, "score": 3.9700724626895583}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.939840812935525, "2": 0.030211129379169227, "5": 0.016946912756575446, "3": 0.01299364873175825, "1": 4.568068911588849e-06}, "score": 3.943517135670684}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9042791879881386, "5": 0.09531031852965964, "3": 0.00027620505919871913, "2": 0.00013252463570125658, "1": 0}, "score": 4.094769231351826}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.825970021254953, "5": 0.17313272190047246, "3": 0.0006965841177236097, "2": 0.00019957489071922851, "1": 0}, "score": 4.17203717686994}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7122208237066328, "4": 0.2877632170581733, "3": 1.189530230586168e-05, "2": 3.4080611707314515e-06, "1": 0}, "score": 4.712202579395515}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9147563942006084, "5": 0.07747131811200349, "2": 0.005355011112077914, "3": 0.0024136926118969917, "1": 1.8246962922205216e-06}, "score": 4.064342242382266}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9265200063683541, "5": 0.052270678796076914, "3": 0.01670671240327382, "2": 0.004496550642609717, "1": 3.6755050726796516e-06}, "score": 4.026559901706252}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9715152091115002, "5": 0.02432141113316094, "3": 0.0029505219266250052, "2": 0.0012108917588896104, "1": 8.466122832896352e-07}, "score": 4.018946587061806}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7566699787361796, "5": 0.23809676793094403, "3": 0.004161194943177736, "2": 0.0010686832455159346, "1": 1.9080037872658037e-06}, "score": 4.231792822557987}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8740643578968638, "4": 0.1259208933190672, "3": 1.191482660719434e-05, "2": 2.2739844518872604e-06, "1": 0}, "score": 4.874048384544857}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9514712958149777, "5": 0.047370964559961766, "3": 0.0007538097068440263, "2": 0.00040348526051681475, "1": 1.6845098831485804e-07}, "score": 4.045809691632063}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9098152427769903, "5": 0.09008391087122922, "3": 8.343947827398651e-05, "2": 1.668894556395878e-05, "1": 0}, "score": 4.089967158091763}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9904759725874495, "5": 0.007681468032686645, "3": 0.0013348389915284911, "2": 0.000506647734301705, "1": 0}, "score": 4.005333339293382}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.736474622915227, "5": 0.2625981137807639, "3": 0.0007975185208010129, "2": 0.00012618569072286897, "1": 1.1263750522539007e-06}, "score": 4.261545481019611}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6859311779342622, "5": 0.31404220226098173, "3": 2.1740079922283044e-05, "2": 4.416765133814963e-06, "1": 0}, "score": 4.314011774025588}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.982533778182674, "5": 0.012760885588325726, "3": 0.0031764355725224258, "2": 0.0015240704435257463, "1": 3.8372868138048795e-06}, "score": 4.0065248037469585}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7802501465553452, "2": 0.17409734189770343, "3": 0.04471189076937649, "5": 0.0008994150053798952, "1": 3.830174888601325e-05}, "score": 3.6078767964590153}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9352607795234387, "5": 0.06364529987429055, "3": 0.0007409666058596246, "2": 0.00035000784130612107, "1": 6.152082552734499e-07}, "score": 4.062202616952047}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5543561437641443, "4": 0.44543767537770823, "3": 0.0001888942921812272, "2": 1.6505399304668844e-05, "1": 0}, "score": 4.554134671544886}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8175584093638096, "4": 0.18242192604250712, "3": 1.5472705837187374e-05, "2": 3.732964006706336e-06, "1": 0}, "score": 4.817535845916646}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7120018067522472, "5": 0.2876747434724388, "3": 0.00021747536026300485, "2": 0.00010434581819921966, "1": 4.832170042646207e-07}, "score": 4.287247455832212}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt4", "target_model": "human", "scores": {"4": 0.963169191989354, "5": 0.035083438411152794, "3": 0.0012980385001598784, "2": 0.0004485901021441396, "1": 0}, "score": 4.0328882440768}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9124319697530893, "4": 0.08756344172967415, "3": 4.037979963791023e-06, "2": 4.255999569799189e-07, "1": 0}, "score": 4.912427194569417}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8257717131432739, "5": 0.1730911577239232, "3": 0.0010454456762858022, "2": 9.135002513406601e-05, "1": 0}, "score": 4.17186306930191}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8670291422685482, "4": 0.13296321074022596, "3": 6.9479910342052535e-06, "2": 5.357715389720107e-07, "1": 0}, "score": 4.867021264257149}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5544092480825462, "5": 0.4454803458963045, "3": 0.00010111753548947943, "2": 8.974691477022618e-06, "1": 0}, "score": 4.445361418729683}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9771908266743616, "2": 0.01309436884959966, "3": 0.007008910575991281, "5": 0.0027021757422930675, "1": 3.114870436527499e-06}, "score": 3.969495164452612}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.5252532456647815, "4": 0.43545023507486696, "3": 0.03864841167025475, "5": 0.0005343285745940565, "1": 0.00011026488956636241}, "score": 2.9110448041803805}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9684119984711473, "5": 0.02349782066011247, "3": 0.00603473702718063, "2": 0.0020532158657087466, "1": 1.5766266894161668e-06}, "score": 4.013351930718215}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8806669771615857, "5": 0.11918531836685424, "3": 0.00011936482480880545, "2": 2.7912079663189073e-05, "1": 0}, "score": 4.119010180267556}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8867093694503305, "5": 0.11273244625916555, "3": 0.00041948281429995103, "2": 0.00013833075017635158, "1": 2.431437511487899e-07}, "score": 4.112035586807015}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9554735829895653, "5": 0.04198057784145039, "3": 0.0016025278343357707, "2": 0.0009420775141404313, "1": 4.4567627022390953e-07}, "score": 4.038492588287735}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.977508306950154, "5": 0.022281500918758957, "3": 0.0001648871924503471, "2": 4.507764998642994e-05, "1": 0}, "score": 4.0220264634327005}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8869829579422764, "5": 0.1127672183071661, "3": 0.0001951379136297848, "2": 5.4187841567838117e-05, "1": 0}, "score": 4.112463760716831}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7310500381013694, "4": 0.26893827141694515, "3": 9.658733751085185e-06, "2": 1.7048677776522637e-06, "1": 0}, "score": 4.73103720859362}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9776859246144377, "2": 0.011928592854459746, "3": 0.007122888126940256, "5": 0.003261095816680174, "1": 9.069377699908891e-07}, "score": 3.9722782847659657}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt4", "target_model": "human", "scores": {"2": 0.599251411635498, "4": 0.33093807688625587, "3": 0.06936838935724475, "5": 0.0003262981578344993, "1": 0.00011276562593050503}, "score": 2.7321129110255065}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9164949241642846, "5": 0.08262452745330122, "2": 0.0005148815416355404, "3": 0.00036510568439666045, "1": 0}, "score": 4.0812297042682015}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9769776728148724, "5": 0.0184619836318598, "2": 0.0029211099940099836, "3": 0.001638594199786664, "1": 4.55706443040463e-07}, "score": 4.0109798043412}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6926360348471532, "4": 0.30735535274022013, "3": 5.55048636895291e-06, "2": 2.879554394267842e-06, "1": 0}, "score": 4.69262485156728}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9962538630442854, "5": 0.0025478561472225283, "2": 0.0007186558253768189, "3": 0.0004787279863696093, "1": 0}, "score": 4.000631817076837}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6934520872042835, "2": 0.21820438708234924, "3": 0.0854500657470102, "5": 0.002704203134276747, "1": 0.00018402314872140136}, "score": 3.4802905737818284}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8408642979462099, "5": 0.14612030349959987, "3": 0.009053761248881574, "2": 0.003955295361579099, "1": 4.704105123193437e-06}, "score": 4.129142050726027}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9701653471811899, "3": 0.012404900287005772, "5": 0.009660946057442788, "2": 0.007762788240347615, "1": 3.970815772965564e-06}, "score": 3.981718519412586}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.748799321451791, "5": 0.2508163703062625, "3": 0.0002802271594381755, "2": 0.00010308981081517669, "1": 0}, "score": 4.2503302116704464}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9588175140052838, "5": 0.034924929236402655, "3": 0.0032485234790853726, "2": 0.0030043930843370835, "1": 2.6553635030646484e-06}, "score": 4.025659704428321}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9881592450715776, "5": 0.009995089066139424, "3": 0.0011752358830523415, "2": 0.0006696292211707039, "1": 3.268429685148708e-07}, "score": 4.007479617756545}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9304432439292888, "5": 0.06532736922232969, "3": 0.0031035179137968443, "2": 0.001124019701094612, "1": 1.217185903595426e-06}, "score": 4.059972198253916}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9162176530805887, "5": 0.08005820871098157, "3": 0.002962041655303303, "2": 0.0007607152110796263, "1": 7.384207890273792e-07}, "score": 4.075572569958363}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9194832330131455, "5": 0.08034355512775414, "3": 0.00014799708209038814, "2": 2.4926775773004746e-05, "1": 0}, "score": 4.080145727576187}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9849878558227615, "5": 0.00623469386808123, "2": 0.004490681531472775, "3": 0.0042850382520760455, "1": 9.281003260834108e-07}, "score": 3.992965502607423}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9925703113102871, "5": 0.0037515645975539596, "3": 0.0022754389503089633, "2": 0.0014018572701641335, "1": 2.5171760320598525e-07}, "score": 3.9986716551887755}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9730861890397545, "2": 0.01838844685291907, "3": 0.00828832235530672, "5": 0.00023147631515907802, "1": 3.7414661673623364e-06}, "score": 3.955154954059463}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9738975584503529, "3": 0.01728875480671154, "5": 0.005612836905552431, "2": 0.003198098066799637, "1": 1.768818054946883e-06}, "score": 3.981922561741813}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8031560581659196, "5": 0.1968218645853257, "3": 2.0136912184103915e-05, "2": 1.552791933367206e-06, "1": 0}, "score": 4.196798698357555}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9894371390019544, "3": 0.006165759219430416, "2": 0.004107281109159696, "5": 0.00027950398719910844, "1": 6.781962795818975e-06}, "score": 3.985878786746534}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5549180132621097, "2": 0.3582819975509746, "3": 0.08248119095987098, "5": 0.0036810398455139706, "1": 0.0006297516642623954}, "score": 3.2027402153572218}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9140536282638176, "5": 0.08240443670573663, "2": 0.0018783416358827455, "3": 0.0016576306756622048, "1": 4.045153743072368e-06}, "score": 4.0769781349076695}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9236700221572685, "2": 0.04671101382670814, "3": 0.020727886736761868, "5": 0.008776737706540706, "1": 0.00010876999965830073}, "score": 3.8942999246130956}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9563349511340425, "5": 0.02843109040577588, "2": 0.008145643781220515, "3": 0.00707705796007818, "1": 8.157914480696399e-06}, "score": 4.005038286752479}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9712986659920987, "5": 0.027553624258575923, "3": 0.0006790971245911066, "2": 0.0004667361729892446, "1": 8.203817961397773e-07}, "score": 4.025938621035616}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9011007927350948, "5": 0.09799017112345824, "3": 0.0006106336313474905, "2": 0.0002975991830907094, "1": 0}, "score": 4.096784416875465}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.615048753705362, "5": 0.38488769059155536, "3": 3.99981241979978e-05, "2": 2.3149138313588706e-05, "1": 0}, "score": 4.3848015513592955}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.5695425410148497, "5": 0.42991326497545707, "3": 0.00033012242085799594, "2": 0.00021314305456777348, "1": 0}, "score": 4.429157254932682}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8031612867288772, "4": 0.19682312424928994, "3": 9.219405517215222e-06, "2": 6.0462337525945615e-06, "1": 0}, "score": 4.803140234577402}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7981743353831489, "4": 0.20181008441240073, "3": 8.742590642787526e-06, "2": 6.3962159517460215e-06, "1": 0}, "score": 4.7981531526636925}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9833041467775967, "5": 0.014246961828734245, "3": 0.0013460423293500004, "2": 0.0010986077309366525, "1": 0}, "score": 4.010703749435681}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9834518157318743, "2": 0.007869101427572758, "3": 0.006033449351698891, "5": 0.0026358188137604157, "1": 3.7813253049760534e-06}, "score": 3.980852707108685}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9490048061013965, "5": 0.05029540791401273, "3": 0.000567530253441824, "2": 0.0001306529482808586, "1": 0}, "score": 4.04946665104831}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8737829457441727, "5": 0.12588037849478204, "3": 0.00026689025874247936, "2": 6.748042514467269e-05, "1": 0}, "score": 4.1254788166241045}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9676979292163796, "5": 0.03209403152290175, "3": 0.00016323249887427875, "2": 4.393343106595274e-05, "1": 0}, "score": 4.031842959971333}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9437040833561259, "5": 0.03229177904111095, "2": 0.013673194071224736, "3": 0.010321068370641734, "1": 7.445192767157239e-06}, "score": 3.994601973832687}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6924353518553382, "5": 0.3072663247908524, "3": 0.00025116134916440834, "2": 4.64601779710395e-05, "1": 0}, "score": 4.306922458492114}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6076327433893257, "4": 0.3923171932249994, "3": 4.0770205527515015e-05, "2": 8.817175300096828e-06, "1": 0}, "score": 4.607574628041666}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6223815312498364, "5": 0.37749347319205273, "3": 0.00010831661492294363, "2": 1.5604487887282337e-05, "1": 0}, "score": 4.37735435305174}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9566132497057596, "5": 0.027998453569300124, "3": 0.008406660253336381, "2": 0.006969366136665681, "1": 1.0478018200073864e-05}, "score": 4.005621637063787}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9885896505088063, "3": 0.007430954223745362, "1": 0.0030023769120635048, "4": 0.0009747290724411599, "5": 9.915702889215004e-07}, "score": 2.0063810184481596}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8080024324561831, "4": 0.19191740150728917, "3": 6.240032963441747e-05, "2": 1.6534441317095675e-05, "1": 0}, "score": 4.807907957993172}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6145461383772937, "5": 0.3845731580979553, "2": 0.0004945455984150071, "3": 0.0003851524993101241, "1": 6.163986029312609e-07}, "score": 4.383197214280615}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7057400785293448, "4": 0.294196255097549, "3": 5.200696011366626e-05, "2": 1.1247293905297329e-05, "1": 0}, "score": 4.705665867799794}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8984416863299268, "5": 0.10080235102057952, "3": 0.0005543477835722782, "2": 0.00020077132181355668, "1": 2.502403452287058e-07}, "score": 4.099845769111215}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt4", "target_model": "human", "scores": {"5": 0.8633491695644938, "4": 0.13660168454047483, "3": 3.5135062305657414e-05, "2": 1.3545773203544592e-05, "1": 2.520064889411598e-07}, "score": 4.863286370862094}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.9172947589907178, "4": 0.08269663227254358, "3": 5.052123035259059e-06, "2": 3.2618957930474207e-06, "1": 0}, "score": 4.917283453415959}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6075873670704223, "4": 0.39228788822522087, "3": 8.766305614153951e-05, "2": 3.654339863435263e-05, "1": 3.016842187215038e-07}, "score": 4.607425855860273}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5621583540531307, "5": 0.4378093663467103, "3": 2.67467657091871e-05, "2": 5.185097044834388e-06, "1": 0}, "score": 4.4377724016167495}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7121474260107897, "5": 0.2877335501998474, "3": 8.386141022020542e-05, "2": 3.4416653409067776e-05, "1": 2.318975865561928e-07}, "score": 4.287580307556906}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9216578912379065, "5": 0.07565429997347037, "3": 0.0022491430544546646, "2": 0.00043601626947578734, "1": 1.647987024485168e-06}, "score": 4.072528253054416}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9528189618053076, "5": 0.045978549797443806, "3": 0.0007431740408226981, "2": 0.0004578562443888442, "1": 8.838707459393132e-07}, "score": 4.044317037104278}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9400093123611296, "5": 0.05471509761776043, "3": 0.00456201758709107, "2": 0.0007106252796021934, "1": 1.0194564141787936e-06}, "score": 4.048728865036758}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6992414320723644, "4": 0.3007399924478061, "3": 1.5471529956227788e-05, "2": 2.565431159744562e-06, "1": 0}, "score": 4.699221206223792}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9527548992704831, "3": 0.028770707791521737, "2": 0.018004248880940522, "5": 0.0003915988828873744, "1": 6.912127413308418e-05}, "score": 3.935404420764804}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9560939621430982, "3": 0.0337542480984772, "4": 0.009823046210343514, "1": 0.00032073382000388843, "5": 6.976075839002828e-06}, "score": 2.0531005898142207}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9804372238751883, "2": 0.011237408742705216, "3": 0.005391767638773326, "5": 0.0029314532182064352, "1": 1.5962059913551326e-06}, "score": 3.9750600657511255}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9426059426333693, "3": 0.035424308985625735, "2": 0.019871236397919274, "5": 0.0020944129074261858, "1": 2.822586203070378e-06}, "score": 3.9269190700803156}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9679439115480007, "5": 0.03015721744137342, "3": 0.0016749762381246009, "2": 0.0002231690504344058, "1": 2.960963289272453e-07}, "score": 4.028035026857962}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9402159199698401, "5": 0.0582567274792002, "3": 0.0011903349986559873, "2": 0.00033574940322536167, "1": 4.668440850556636e-07}, "score": 4.056393538330263}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9291289877542249, "2": 0.04345593686047278, "3": 0.026357358052413096, "5": 0.0010544267760013593, "1": 0}, "score": 3.8877848257522283}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9627324418020348, "2": 0.023360007499077712, "3": 0.00900608697228738, "5": 0.00489652455504654, "1": 3.216055337054618e-06}, "score": 3.9491606868165476}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.882745024988301, "2": 0.0847144576031111, "3": 0.02427109846670053, "5": 0.008257827835032311, "1": 9.083109209600177e-06}, "score": 3.814530099676408}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9190646600143111, "5": 0.08030698303337352, "3": 0.00043478943566978973, "2": 0.00019293658464915602, "1": 0}, "score": 4.079486370578899}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8652669819669453, "5": 0.13269298535076257, "2": 0.0011302211018995876, "3": 0.0009081581686360428, "1": 7.423336735872048e-07}, "score": 4.129522275982212}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.98537070042614, "2": 0.006536443949506778, "3": 0.004422779209775333, "5": 0.0036666127481866525, "1": 2.334151771183528e-06}, "score": 3.9861639275560377}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9345162306177994, "5": 0.06359462021679825, "3": 0.0011114375627522012, "2": 0.0007759084667169394, "1": 8.534524568608343e-07}, "score": 4.060928863226376}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9849469215630607, "5": 0.009506374551291535, "2": 0.0033896022325672986, "3": 0.002154562267906903, "1": 1.6288000172493302e-06}, "score": 4.000567721935158}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7430428457837562, "5": 0.25678872856768314, "2": 9.314277751440442e-05, "3": 7.484232430892181e-05, "1": 0}, "score": 4.256527713700793}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5466996572635905, "5": 0.45322993477076146, "3": 4.565118467502011e-05, "2": 2.4056483825826074e-05, "1": 0}, "score": 4.453136487948624}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9376741766194664, "2": 0.031588005602031295, "5": 0.01690783762104128, "3": 0.01379977487993812, "1": 2.7059348814932694e-05}, "score": 3.9398506842651364}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8517314767180926, "5": 0.14800873302991188, "3": 0.0002482413747132732, "2": 1.0906964803360493e-05, "1": 0}, "score": 4.147738772560954}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7604754417850893, "5": 0.23929420519759032, "3": 0.00020180957564621427, "2": 2.7742056805220294e-05, "1": 0}, "score": 4.239037103069051}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6222519089006806, "5": 0.3774148494905296, "3": 0.00027225130575529645, "2": 5.887847405882385e-05, "1": 0}, "score": 4.3770256374503225}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7307960423474473, "5": 0.26884485848822004, "3": 0.00031974204392131085, "2": 3.818774138518999e-05, "1": 0}, "score": 4.268449054880223}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt4", "target_model": "human", "scores": {"5": 0.636890880679395, "4": 0.36288946326550253, "3": 0.0001856250089856071, "2": 3.328073023814635e-05, "1": 0}, "score": 4.636639171890413}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.607455498468743, "4": 0.392202731768755, "3": 0.0002536066787456884, "2": 8.764412296626948e-05, "1": 0}, "score": 4.607026918567234}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7717878055626549, "4": 0.22814004639966207, "3": 4.864697159927543e-05, "2": 2.3341072056631064e-05, "1": 5.2679102344205785e-08}, "score": 4.771692401223749}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7826362737291014, "4": 0.21733022673279773, "3": 2.724302589689406e-05, "2": 5.891717540542733e-06, "1": 0}, "score": 4.782597532755527}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7715722984759281, "5": 0.22807633578230455, "3": 0.00022487856782614594, "2": 0.00012614544390723663, "1": 0}, "score": 4.227599244104161}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7684152514219712, "2": 0.17689923540737307, "3": 0.05229131933423974, "5": 0.0022975199969168815, "1": 9.48299756352021e-05}, "score": 3.595922494857116}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7431130666505664, "4": 0.25681299624916265, "3": 6.402211419442093e-05, "2": 9.516037735997055e-06, "1": 0}, "score": 4.743030308891609}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9289100531570086, "5": 0.06942603761917435, "3": 0.0013749082188757801, "2": 0.000288196217226575, "1": 2.213005731432681e-07}, "score": 4.067474112434404}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7981839853691977, "4": 0.20181250614794408, "3": 2.708363445878982e-06, "2": 6.741649655318436e-07, "1": 0}, "score": 4.798180029210145}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9492828444950158, "5": 0.050310151658662546, "3": 0.00028545561644214407, "2": 0.0001208695129061113, "1": 0}, "score": 4.049782990804968}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9369535041625078, "5": 0.0392816928275542, "3": 0.01637504580848503, "2": 0.007380811404531041, "1": 5.667587589422414e-06}, "score": 4.008128048092681}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8740737366577409, "4": 0.1259222532720588, "3": 3.157152639552151e-06, "2": 6.93534396505301e-07, "1": 0}, "score": 4.874069331748244}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7371124060774212, "4": 0.2628255433965695, "3": 4.793618072239321e-05, "2": 1.3733945720122628e-05, "1": 0}, "score": 4.7370372823739215}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8807932033979086, "4": 0.11920239884676337, "3": 2.596601716405769e-06, "2": 1.3470992243964717e-06, "1": 0}, "score": 4.880788312523541}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.8807933883645007, "4": 0.11920243460748838, "3": 3.181422926784926e-06, "2": 8.170569812715688e-07, "1": 0}, "score": 4.880788730090768}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9775380422275995, "5": 0.020932171443665687, "3": 0.0011268343926717083, "2": 0.00040178517609688744, "1": 6.040595809014568e-07}, "score": 4.0189999652113455}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8594482718265283, "5": 0.14030106514392637, "3": 0.00024278385404039322, "2": 7.564161925552401e-06, "1": 0}, "score": 4.140043197081543}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9580911494247584, "3": 0.025532265830056997, "2": 0.008823714963204773, "5": 0.007547323363269788, "1": 4.730110472617912e-06}, "score": 3.9643534081767795}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9397227885586696, "5": 0.06007447118370573, "3": 0.00018532120410501274, "2": 1.6970313586744152e-05, "1": 0}, "score": 4.059855236211862}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8667864427645404, "5": 0.13292599954548945, "3": 0.00026064870893862627, "2": 2.621412946515573e-05, "1": 1.6335550480795823e-07}, "score": 4.132612502994129}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt4", "target_model": "human", "scores": {"5": 0.9283956315000721, "4": 0.07159017751292586, "3": 1.2266090164759467e-05, "2": 1.5840162591655585e-06, "1": 0}, "score": 4.928380513844275}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8840276840820123, "4": 0.11595918537559143, "3": 1.167988998150793e-05, "2": 1.193175878877515e-06, "1": 0}, "score": 4.884013845453096}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5385768399464191, "4": 0.46066918344416724, "3": 0.000660872253018407, "2": 9.22784427566464e-05, "1": 4.014431129096219e-07}, "score": 4.537730434729268}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8221814633139548, "4": 0.17780922021849407, "3": 7.947373986722181e-06, "2": 1.0263066261166848e-06, "1": 0}, "score": 4.822171745156452}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.9324509121274016, "4": 0.06754652224913153, "3": 2.351248721699014e-06, "2": 1.456857401275461e-07, "1": 0}, "score": 4.932448333556148}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt4", "target_model": "human", "scores": {"4": 0.823965836904098, "5": 0.17271262376570945, "3": 0.0021741306402005647, "2": 0.0011456863376830806, "1": 5.592042756745384e-07}, "score": 4.168245638531899}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7370848828140408, "4": 0.262815687623489, "3": 8.955326231734577e-05, "2": 9.587484576322156e-06, "1": 0}, "score": 4.736976367432826}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5307723335800254, "4": 0.46840494036197, "3": 0.0006411981643937826, "2": 0.00018085824686956683, "1": 0}, "score": 4.529769773680496}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5466983725209055, "5": 0.45322886968166626, "3": 4.8595335938825726e-05, "2": 2.368347524640614e-05, "1": 0}, "score": 4.453133124439767}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7489762162308465, "5": 0.2508755950424968, "3": 0.00011684374833928666, "2": 3.096051113037467e-05, "1": 0}, "score": 4.250696926656639}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9763548644764575, "5": 0.02090683792658801, "2": 0.0014006708199680563, "3": 0.001336529433242048, "1": 5.324350066773514e-07}, "score": 4.01676737902043}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.8031618087838833, "4": 0.19682326202552514, "3": 1.2406078547762662e-05, "2": 2.224287318382608e-06, "1": 0}, "score": 4.803145194130342}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9382365183516536, "5": 0.059979460521989346, "3": 0.0010160039927109056, "2": 0.0007669200494771423, "1": 3.984722409452592e-07}, "score": 4.057428461133808}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6583987553745084, "5": 0.34157274723750103, "3": 1.757215519396655e-05, "2": 1.0492813119114936e-05, "1": 0}, "score": 4.341534337142236}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8723317414312205, "5": 0.12567130136421145, "3": 0.0011217832189959584, "2": 0.0008736456493904138, "1": 5.828505674517112e-07}, "score": 4.122800594400927}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9799367080750672, "5": 0.017948163163647692, "3": 0.0019517721973084648, "2": 0.0001627341777056622, "1": 2.0283104400433726e-07}, "score": 4.015670320692362}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9207595515941905, "2": 0.050347505713598646, "3": 0.02780453338993152, "5": 0.001078098756325259, "1": 8.231378996673271e-06}, "score": 3.8725535948198515}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9777653560231392, "5": 0.01936359543032877, "3": 0.0027895898531353166, "2": 8.038073700303466e-05, "1": 4.5607389049498505e-07}, "score": 4.016411886087781}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9862831472577669, "5": 0.013635731710336909, "3": 7.26805316151748e-05, "2": 8.15452964858815e-06, "1": 0}, "score": 4.013546745993395}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9746743965647884, "3": 0.017851780996847554, "2": 0.006990857884567457, "5": 0.0004757338494122916, "1": 4.381357281317335e-06}, "score": 3.968629003624728}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5824887540969386, "4": 0.22810589639090798, "3": 0.18910643013670422, "1": 0.0001594835142524635, "5": 0.0001364134786984114}, "score": 2.645569930999624}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8879331680741416, "3": 0.062342693435625304, "2": 0.049317129693358955, "5": 0.0003765408565043532, "1": 2.5623952484369725e-05}, "score": 3.839321937854121}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8755121758874962, "5": 0.1222488814942866, "3": 0.0021034088256290297, "2": 0.00013446642746577626, "1": 3.082603866285155e-07}, "score": 4.119875706030783}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8665570434222004, "5": 0.13289083197888396, "3": 0.00051018987378179, "2": 4.1229645887171215e-05, "1": 0}, "score": 4.132298276094096}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9233504783787613, "5": 0.075793215167775, "3": 0.0007201894900176771, "2": 0.00013531962300601015, "1": 0}, "score": 4.07480244607476}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9468434821657347, "2": 0.03448877052354583, "3": 0.0170731760353698, "5": 0.0015880527481336626, "1": 4.530754844549846e-06}, "score": 3.9155235754812363}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.743107931757017, "5": 0.256811224245602, "3": 7.031404447078925e-05, "2": 9.368439666190922e-06, "1": 0}, "score": 4.2567224715083505}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7925561452490628, "5": 0.20675060889584268, "3": 0.0005370781195571876, "2": 0.00015387553447953288, "1": 6.288541393893477e-07}, "score": 4.205904235635084}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8872032142834958, "4": 0.11279524444301856, "3": 1.0403732655716339e-06, "2": 3.0276588102038617e-07, "1": 0}, "score": 4.887201744163599}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.992420117803751, "5": 0.006184346113923855, "3": 0.0007620609641741559, "2": 0.0006219760318318156, "1": 6.193668483775803e-06}, "score": 4.004159774149975}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5415426245185213, "2": 0.4351417234154509, "3": 0.02099788627281734, "5": 0.002213160487961021, "1": 0.000101906075228351}, "score": 3.110623708527371}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9725227922531576, "5": 0.014766981061194366, "2": 0.00655280812392325, "3": 0.006155793549723767, "1": 9.021482260068599e-07}, "score": 3.995502861568128}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9459309349952759, "5": 0.0501325089543213, "3": 0.0025352551401540257, "2": 0.0014001008629384523, "1": 2.76111518582909e-07}, "score": 4.044796265142607}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6513106771283337, "5": 0.3486214904218124, "3": 5.9731980155196265e-05, "2": 7.594069076512681e-06, "1": 0}, "score": 4.348546746807794}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7429709004282896, "5": 0.25676387262180494, "3": 0.00020662644675676007, "2": 5.8281665470216746e-05, "1": 0}, "score": 4.2564407646070865}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9412144965953875, "3": 0.03271376636221611, "2": 0.023933902752306235, "5": 0.002124255268317796, "1": 1.2435453645889854e-05}, "score": 3.9215052872764993}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9898968224819058, "3": 0.005886140848784848, "5": 0.002415667337070067, "2": 0.0017951715330856675, "1": 3.747093819132783e-06}, "score": 3.9929279248090848}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9738830844923955, "5": 0.025154612491187195, "3": 0.0007837158809836102, "2": 0.00017762446207185195, "1": 0}, "score": 4.024015670805307}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8594902740898894, "5": 0.1403079260337593, "3": 0.00015922918157517985, "2": 4.219153286767025e-05, "1": 0}, "score": 4.1400643668935215}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.857572307398736, "3": 0.09325666019556254, "2": 0.049142806558373726, "5": 1.8391002638141882e-05, "1": 7.090363140808978e-06}, "score": 3.8084543209073236}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt4", "target_model": "human", "scores": {"2": 0.6948758517147183, "4": 0.28075524596483753, "3": 0.022336749439027654, "1": 0.0015439714785374628, "5": 0.0004858321811361247}, "score": 2.5837621378202806}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9576915842047126, "5": 0.04207802693831513, "3": 0.00018593674922760117, "2": 4.416384897648662e-05, "1": 0}, "score": 4.04180377454144}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6368559418040631, "5": 0.3628695774677914, "3": 0.00022389418636858426, "2": 4.99575456607246e-05, "1": 0}, "score": 4.362545996230125}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5774719264359053, "5": 0.42248748665843366, "3": 3.755440035757899e-05, "2": 2.6367327551568527e-06, "1": 0}, "score": 4.422444825984631}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6513334082676215, "5": 0.3486336575241429, "3": 2.8660691733619003e-05, "2": 4.1939858473060635e-06, "1": 0}, "score": 4.348596636584834}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9704820880088645, "5": 0.018921389069569913, "3": 0.0067466276928442636, "2": 0.0038441125842366745, "1": 5.1806086945297475e-06}, "score": 4.004470997073869}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.5621707216729632, "4": 0.43781899825872056, "3": 9.537062823930752e-06, "2": 6.096840285278956e-07, "1": 0}, "score": 4.562160040190082}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.943781369279169, "3": 0.03229441738723358, "2": 0.02362710048822626, "5": 0.0002928104753642016, "1": 3.3560864830841618e-06}, "score": 3.9207340488441655}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6076482989866673, "5": 0.3923272170573402, "3": 1.9870308015216243e-05, "2": 4.433665009633829e-06, "1": 0}, "score": 4.392298550026364}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9848399611505411, "5": 0.01404798935287559, "3": 0.000986323661625087, "2": 0.0001253969816289145, "1": 0}, "score": 4.012810875940892}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.6321119085625805, "2": 0.2718679251267715, "3": 0.09543463653652147, "5": 0.0004217116800759513, "1": 0.0001457396131660578}, "score": 3.3608024503298304}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9614503628373967, "5": 0.03727947395177325, "3": 0.0007617155240501935, "2": 0.0005074119295196953, "1": 2.895502441702668e-07}, "score": 4.03550209240986}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8482287052206222, "5": 0.1474000441060518, "3": 0.0037481983291903524, "2": 0.0006215122107388473, "1": 6.422070997471235e-07}, "score": 4.142407022605095}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8774640264333546, "4": 0.12252142087483073, "3": 1.1961181819310292e-05, "2": 2.0145917269368417e-06, "1": 0}, "score": 4.877448542284176}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9674115610729949, "5": 0.02876038383723978, "3": 0.003434939384147213, "2": 0.0003914585198494371, "1": 5.443045021994755e-07}, "score": 4.024540921811019}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9687929188179442, "3": 0.017468965017647078, "2": 0.012582423489997994, "5": 0.00115220313475562, "1": 1.8730283471373605e-06}, "score": 3.95851270498739}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9902679667441691, "5": 0.008567494038868457, "3": 0.0009463434498415974, "2": 0.00021786063251602944, "1": 1.0971233861612218e-07}, "score": 4.007185101806661}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7101272852603809, "2": 0.20991323506469517, "3": 0.07967406929616432, "5": 0.0002657549272479213, "1": 1.672575183826161e-05}, "score": 3.5007135754869037}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7057274247231785, "5": 0.2941909596126167, "3": 7.566831842378576e-05, "2": 5.655392744318032e-06, "1": 0}, "score": 4.294104066373279}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8453032248655962, "2": 0.12177748414881995, "3": 0.032775965216080956, "5": 0.00012007007827625766, "1": 1.8703310830796134e-05}, "score": 3.7237317689539844}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9264152275133277, "3": 0.04612349988355876, "2": 0.02547181582078911, "5": 0.001964175528657229, "1": 2.434198307043478e-05}, "score": 3.904823928658223}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5850417130110018, "5": 0.41485669567986755, "3": 8.573949386064941e-05, "2": 1.5614321812012348e-05, "1": 0}, "score": 4.414739826040378}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.49989435144316274, "5": 0.49989435144316274, "3": 0.00017301919774480814, "2": 3.6837912947022776e-05, "1": 0}, "score": 4.499648375914675}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5698394639586243, "4": 0.4301373941721572, "3": 1.8060632291224546e-05, "2": 4.7113974284616e-06, "1": 0}, "score": 4.569812191270532}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.49998289057271184, "5": 0.49998289057271184, "3": 2.6955963633154017e-05, "2": 7.142619301041629e-06, "1": 0}, "score": 4.4999417094992875}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9573496057278554, "1": 0.04206300355747975, "3": 0.00047463631491593666, "4": 0.0001092674512394054, "5": 0}, "score": 1.958630023404937}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9825382654246855, "3": 0.008634486814606605, "5": 0.004550054809717832, "2": 0.004274380924766215, "1": 1.2654079470325861e-06}, "score": 3.987362990377108}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9895497745262564, "5": 0.009701206691736889, "3": 0.0006918578794199667, "2": 5.679109628899686e-05, "1": 0}, "score": 4.008895769909451}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8396734774805378, "5": 0.16025448436755568, "3": 7.011547725940084e-05, "2": 1.4326395156156303e-06, "1": 0}, "score": 4.160181582105867}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9942204581835863, "3": 0.004978277158048195, "2": 0.0006843463560560458, "5": 0.00011171651627696588, "1": 0}, "score": 3.9937647142114945}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9857074039268067, "3": 0.010286780033715382, "2": 0.0030886514724895574, "5": 0.000913003631345398, "1": 0}, "score": 3.984448855945341}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9845613814548823, "5": 0.009958697390748571, "3": 0.003606801177037976, "2": 0.0018711838005197059, "1": 9.133159127917351e-07}, "score": 4.002606791331317}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9265981894249882, "3": 0.044713254502841776, "2": 0.022134666047303665, "5": 0.006542994785849626, "1": 9.241004186713347e-06}, "score": 3.91753254875531}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.636981841560972, "5": 0.36294128758102495, "3": 5.93377714154985e-05, "2": 1.7000556145533793e-05, "1": 0}, "score": 4.362848141924999}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9842090670337303, "5": 0.011822012727335131, "3": 0.003083956279308679, "2": 0.0008835682673290409, "1": 5.53755823036954e-07}, "score": 4.006969264513576}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7627449470919186, "5": 0.2254669711879742, "2": 0.007024637967259333, "3": 0.004753107805680392, "1": 9.767431725581474e-06}, "score": 4.206635402628016}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6650299777626467, "5": 0.3343980597404488, "3": 0.0004103303463013394, "2": 0.00016068767240784397, "1": 3.3020637472455184e-07}, "score": 4.333665568391565}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9624562869571094, "5": 0.023353306474234205, "3": 0.008726493070283713, "2": 0.00546089982330882, "1": 1.0769355540221038e-06}, "score": 4.003701790120074}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9284003570458629, "4": 0.07159054978281681, "3": 6.565597771838677e-06, "2": 2.065957001340727e-06, "1": 0}, "score": 4.928390088094316}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6369687389792517, "4": 0.362933847360892, "3": 7.500843380625571e-05, "2": 2.1828698695782327e-05, "1": 1.0593819276694833e-07}, "score": 4.636850055028208}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9345872229051371, "3": 0.025696504705688728, "2": 0.025298117326243263, "5": 0.014414432750521186, "1": 2.3566368944340563e-06}, "score": 3.938114538966204}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.6287599076490583, "4": 0.3161603365280391, "3": 0.05494043393514029, "1": 0.00010441575332306342, "5": 2.5991136029817e-05}, "score": 2.687240791396547}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9874465601253114, "5": 0.011677013824274888, "3": 0.0008327658897631463, "2": 4.345072589275083e-05, "1": 0}, "score": 4.010757348735689}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8669107661911816, "5": 0.13294507579511242, "3": 0.00011935074059046339, "2": 2.462941740472836e-05, "1": 0}, "score": 4.132776489834769}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9872088007604053, "2": 0.0068629108849054335, "3": 0.005870158757131111, "5": 5.6656774073254714e-05, "1": 5.820997570715134e-07}, "score": 3.98045891254215}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9780908515660574, "5": 0.013735411499002453, "3": 0.005549607913142446, "2": 0.002621449158995354, "1": 1.519463873693303e-06}, "score": 4.002938350285906}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7547415546930187, "5": 0.24502870794896542, "3": 0.00017675340303366632, "2": 5.224820613778062e-05, "1": 0}, "score": 4.244747638206447}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9234246670298627, "5": 0.07579930918725081, "3": 0.00043007927749611657, "2": 0.00034557840794401134, "1": 1.3136436007394541e-07}, "score": 4.074677696530111}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5467112091493936, "4": 0.4532395116204623, "3": 3.904838655288117e-05, "2": 9.872978272857974e-06, "1": 0}, "score": 4.546652610434306}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8983842292276446, "5": 0.10079590995614349, "3": 0.0006791578385879204, "2": 0.00014015200140583012, "1": 1.8022982408509795e-07}, "score": 4.0998359444390875}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8206962858045534, "5": 0.1774880138415501, "3": 0.0016864959582444663, "2": 0.00012803242574416668, "1": 3.3782865765859623e-07}, "score": 4.175544585974824}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7248104547742418, "5": 0.2751070456905208, "3": 6.342864402815428e-05, "2": 1.9044732572629558e-05, "1": 0}, "score": 4.275005534775118}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8424260627111457, "5": 0.15583316486535892, "3": 0.0015762305660372634, "2": 0.00016355765497004981, "1": 2.8748504369288095e-07}, "score": 4.153929063779314}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6076289578491264, "4": 0.3923147216344676, "3": 4.61983719349848e-05, "2": 9.385768549650687e-06, "1": 0}, "score": 4.607564435335913}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6652702698937676, "5": 0.3345188995878369, "3": 0.00015825356018079955, "2": 5.218648524236093e-05, "1": 0}, "score": 4.334256403575263}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9183275717861418, "2": 0.05514986396070458, "3": 0.01818648942236924, "5": 0.008326381591067212, "1": 7.359077299487777e-06}, "score": 3.8798178064906312}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8349492620412038, "5": 0.1644112611872642, "3": 0.0004839596608849897, "2": 0.00015468264369330252, "1": 2.761670225761088e-07}, "score": 4.1636171990853965}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.711992743026938, "5": 0.2876710612592886, "3": 0.00020751394826468974, "2": 0.00012784563479315477, "1": 2.318472702394281e-07}, "score": 4.287207334054265}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8519431327321088, "4": 0.14804551777038452, "3": 7.267414276806564e-06, "2": 3.8899665474427855e-06, "1": 0}, "score": 4.8519282490543665}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7368253640700027, "5": 0.26272316650917477, "3": 0.0003223798658884935, "2": 0.00012823385099620466, "1": 3.033040709963147e-07}, "score": 4.262143553837146}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt4", "target_model": "human", "scores": {"4": 0.962914011968446, "5": 0.03193536380458897, "3": 0.0035830485165108156, "2": 0.0015653179698568696, "1": 1.0442976539418614e-06}, "score": 4.025218577056707}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9645161908466573, "5": 0.035132494764884566, "3": 0.0002442351664253054, "2": 0.00010669844215472813, "1": 0}, "score": 4.034674875917644}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5155546332780446, "4": 0.4843187570954062, "3": 0.0001016716555749408, "2": 2.4529428450149462e-05, "1": 0}, "score": 4.515404113330066}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.637026113337387, "4": 0.36296651287708065, "3": 5.606578037671559e-06, "2": 1.331679007830355e-06, "1": 0}, "score": 4.637018120840872}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7879289958290873, "4": 0.2120682122852512, "3": 1.8664506104350067e-06, "2": 7.309125609606948e-07, "1": 0}, "score": 4.7879258208226485}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.842432684206021, "5": 0.1558343647853481, "3": 0.00145778575592935, "2": 0.0002739099925185974, "1": 5.628734567816168e-07}, "score": 4.153827176931907}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9601817975509958, "5": 0.029915375499629, "3": 0.00792678538038808, "2": 0.001973132889856038, "1": 2.0388349830102193e-06}, "score": 4.018036223523283}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9649794222150456, "3": 0.021995913343333864, "5": 0.009313658503066686, "2": 0.003704717394245979, "1": 4.27052836287706e-06}, "score": 3.979895458214867}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5621431759824762, "4": 0.437797545653399, "3": 5.319091217430395e-05, "2": 5.694566974729505e-06, "1": 0}, "score": 4.562078816768675}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9946140793603622, "5": 0.005058674937682125, "3": 0.00022576272490798613, "2": 0.00010018160189449366, "1": 0}, "score": 4.004632555037677}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9658664034884136, "3": 0.02494754895217738, "4": 0.00809928089208297, "1": 0.0010791247317388254, "5": 6.122867655653648e-06}, "score": 2.0400854155000405}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.969062298132062, "5": 0.026644396850180423, "3": 0.0030843128052613702, "2": 0.0012078342489716548, "1": 4.381077290838239e-07}, "score": 4.021143116443783}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6790963239481994, "4": 0.3207823895225064, "3": 0.00011102646074178704, "2": 9.854158590000186e-06, "1": 0}, "score": 4.678965864769286}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.807816168967729, "5": 0.19187316964415985, "3": 0.000275259574011501, "2": 3.4995327688512074e-05, "1": 0}, "score": 4.1915279972683}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8416982010908918, "5": 0.15569852087916383, "3": 0.002022170782064046, "2": 0.0005793616291318713, "1": 1.1360434388182923e-06}, "score": 4.152514311677479}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9362239203243377, "2": 0.025342420189186053, "5": 0.021009604261998088, "3": 0.017417566727615366, "1": 5.4889367033934645e-06}, "score": 3.9528906832573045}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8301765748786182, "5": 0.16866061136588736, "3": 0.0009275241741952194, "2": 0.00023451476694821014, "1": 0}, "score": 4.167264187256488}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7966873665062546, "5": 0.1952366434555863, "3": 0.007111493506876271, "2": 0.0009624359879884323, "1": 1.2571440961022903e-06}, "score": 4.186196656130689}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6722396903408994, "5": 0.32762346584663987, "3": 0.00011699369658028818, "2": 1.9399456650371954e-05, "1": 0}, "score": 4.327467820813155}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8219984249886457, "5": 0.17776962651407405, "3": 0.00018084106615221123, "2": 5.021775040705995e-05, "1": 0}, "score": 4.1774885078552115}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt4", "target_model": "human", "scores": {"5": 0.6723001946356825, "4": 0.32765292052018724, "3": 4.2376143812609555e-05, "2": 4.195806432202141e-06, "1": 0}, "score": 4.672249637221808}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5620502051900652, "5": 0.4377251399274666, "3": 0.00016127267371295382, "2": 6.31552864552042e-05, "1": 0}, "score": 4.437437655945202}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8705842682816837, "4": 0.12940078894324966, "3": 1.2632774125449462e-05, "2": 2.161212826709276e-06, "1": 0}, "score": 4.870567442611994}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7310237865658503, "4": 0.26892861670630436, "3": 4.130363695541713e-05, "2": 5.6778665680766626e-06, "1": 0}, "score": 4.730971576907251}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6991973113300247, "4": 0.3007210163529847, "3": 7.266163713334387e-05, "2": 8.678195001954555e-06, "1": 0}, "score": 4.699107525745552}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7368629210159399, "5": 0.26273656573234405, "3": 0.0002322135814734296, "2": 0.00016725716831399244, "1": 3.894703880777566e-07}, "score": 4.2621688406076}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.893291976660503, "4": 0.10668851123452397, "3": 1.4688186892566224e-05, "2": 4.078762191560553e-06, "1": 0}, "score": 4.893269796574477}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6075040118019623, "4": 0.3922340700189697, "3": 0.0002273495174940733, "2": 3.379248896973874e-05, "1": 0}, "score": 4.607209548605947}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7309704822548327, "5": 0.2689090394156301, "3": 9.753912289328168e-05, "2": 2.210665198354167e-05, "1": 0}, "score": 4.268767510752414}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5774873451421799, "4": 0.42249876722492236, "3": 1.2192457928171253e-05, "2": 1.3467476773777858e-06, "1": 0}, "score": 4.577472660396133}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9945179778266184, "3": 0.00467805899378864, "4": 0.0007062812702666823, "1": 9.709001695018927e-05, "5": 2.6847796322919494e-07}, "score": 2.0059943388899173}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9692065033923606, "3": 0.01494837471157732, "2": 0.011283625217669567, "5": 0.0045589967072672336, "1": 1.2288853732963317e-06}, "score": 3.967039643008791}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9291253864572477, "5": 0.06944212549579924, "3": 0.0010061374363356072, "2": 0.00042602539533895115, "1": 0}, "score": 4.067583959248122}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7248553509242298, "4": 0.2751240478313052, "3": 1.5303821339488896e-05, "2": 5.206862973263768e-06, "1": 0}, "score": 4.724829699017632}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9919389707610655, "5": 0.007340531702107983, "3": 0.0005749548741418069, "2": 0.00014537135798398335, "1": 0}, "score": 4.006474835221168}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9855543098286391, "3": 0.007293286583920058, "2": 0.004423601923218331, "5": 0.002725302085355286, "1": 2.3345859637916273e-06}, "score": 3.9865777922603307}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8989054432180424, "5": 0.10085439862650769, "3": 0.00018006313834421618, "2": 5.937852078119457e-05, "1": 0}, "score": 4.100555650494355}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9788641109679801, "5": 0.019084810921737277, "3": 0.0014263845827181658, "2": 0.0006231412745227888, "1": 0}, "score": 4.016412169265813}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9723271034021671, "5": 0.027582796936307875, "3": 6.128729474770474e-05, "2": 2.8059368188229457e-05, "1": 0}, "score": 4.0274654115866}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.942706358137038, "5": 0.05661391363742447, "3": 0.0005637636243939697, "2": 0.00011453558468247905, "1": 0}, "score": 4.05582115861302}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7255737048639546, "2": 0.23555927468967916, "3": 0.037270889477462314, "5": 0.0011980707790788456, "1": 0.00039508181023081834}, "score": 3.491621872348524}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8868203587141039, "5": 0.1127465386957069, "3": 0.00038800668077382407, "2": 4.4218734553803535e-05, "1": 1.7791018369212114e-07}, "score": 4.112269639321467}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5616234901247816, "4": 0.4373928139004753, "3": 0.0009129783414950753, "2": 6.823533628161842e-05, "1": 1.102921488709618e-06}, "score": 4.5605715055848455}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.658406669375111, "4": 0.3415768802927475, "3": 1.4797423206819982e-05, "2": 1.2929844300134447e-06, "1": 0}, "score": 4.658389522953567}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.926026210186026, "2": 0.038221664141526016, "5": 0.025066379321454575, "3": 0.01061377068251153, "1": 7.040628663461725e-05}, "score": 3.9377979638772405}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5846957222338081, "5": 0.4146113514806931, "3": 0.0005675603333423663, "2": 0.00012467639718221683, "1": 3.238731209034736e-07}, "score": 4.413793618050442}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7771505106290855, "5": 0.2226573580838733, "3": 0.00015326057203206558, "2": 3.8750341085391695e-05, "1": 4.004063594032582e-08}, "score": 4.222426494576015}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9195911866814576, "5": 0.06872955283367053, "3": 0.006293732386948915, "2": 0.005383314588500146, "1": 1.3420315634258152e-06}, "score": 4.051665210200118}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5621348563250373, "4": 0.43779106629767073, "3": 4.8430101778131586e-05, "2": 2.5520870233762882e-05, "1": 0}, "score": 4.562035455527041}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9783588127797597, "2": 0.010210091347293428, "3": 0.010210091347293428, "5": 0.0012005161375931736, "1": 1.8807515638669087e-05}, "score": 3.970513769986206}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9585705668848531, "1": 0.0383476473444933, "3": 0.0027778945342596933, "4": 0.0003020820163928858, "5": 0}, "score": 1.9650343479619952}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9522677602217743, "5": 0.035787414416368304, "2": 0.007157933192108744, "3": 0.004768211461765661, "1": 1.4256694102130678e-05}, "score": 4.016660640194981}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8406082264974419, "5": 0.15549689739587555, "3": 0.0028928740212377066, "2": 0.0009997505101099176, "1": 1.5267336101872801e-06}, "score": 4.150600051314788}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7308370338470584, "5": 0.268859914221852, "3": 0.0002267439841685307, "2": 7.477222989540559e-05, "1": 0}, "score": 4.268484038093402}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7642819831646188, "2": 0.1349037928704803, "3": 0.0956611135587118, "5": 0.00506985328331466, "1": 7.94252682829086e-05}, "score": 3.639361496264488}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9498809433790485, "5": 0.045836777862676786, "3": 0.003646749704605791, "2": 0.0006337100769460942, "1": 8.407949698312363e-07}, "score": 4.040920125646589}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9662395414443896, "5": 0.029177905998335165, "3": 0.002432784725959151, "2": 0.002146924985314065, "1": 2.084005072614624e-06}, "score": 4.022445036318742}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.955744628132013, "3": 0.021447664943000905, "5": 0.011660890835405778, "2": 0.011126899766283211, "1": 1.7531452578994547e-05}, "score": 3.9679067554638627}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.592635523785873, "5": 0.4073120417287027, "3": 4.3672104528394076e-05, "2": 8.599547262378747e-06, "1": 0}, "score": 4.407251236843848}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7929212806938021, "5": 0.2068458808455695, "3": 0.0001539464104811077, "2": 7.862813271385394e-05, "1": 1.238857583043411e-07}, "score": 4.2065343354337354}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9838068134494328, "5": 0.01447870977400129, "3": 0.0011164782135953176, "2": 0.00059760772351936, "1": 1.8832888767729308e-07}, "score": 4.01216645359054}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9564886943342159, "5": 0.04335920313077087, "3": 0.000133756978212199, "2": 1.8102038531221383e-05, "1": 0}, "score": 4.043189252592867}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9374296068343774, "5": 0.05992787039604523, "3": 0.002435169293044633, "2": 0.00020623629158516646, "1": 3.35258822147621e-07}, "score": 4.057079267375135}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9694814820476514, "5": 0.030205114942066912, "3": 0.0002961208233300466, "2": 1.6969074799068614e-05, "1": 0}, "score": 4.029875065323385}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9754645011463811, "2": 0.013071234537393242, "3": 0.008844439699118417, "5": 0.002614411381288607, "1": 4.055380662325602e-06}, "score": 3.9676152924916552}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8899042378200738, "5": 0.10965770911755317, "3": 0.0003715260779143433, "2": 6.55782809443342e-05, "1": 0}, "score": 4.109155130033606}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9304659470214173, "5": 0.061370869163758814, "2": 0.004111593552298812, "3": 0.00404784920265259, "1": 2.383191505211557e-06}, "score": 4.049092749943485}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.49985321183095727, "5": 0.49985321183095727, "3": 0.00025172080533047893, "2": 4.1092291861497134e-05, "1": 0}, "score": 4.4995196876957575}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8031725150021511, "4": 0.19682589947490717, "3": 1.1360695681178695e-06, "2": 1.5617151164650023e-07, "1": 0}, "score": 4.8031713021451345}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8474245925740196, "5": 0.15193484520494305, "3": 0.00037660879060233784, "2": 0.0002629154658703517, "1": 4.078248679153103e-07}, "score": 4.1510312771788}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8346854764510642, "5": 0.1643593154365899, "3": 0.0008359428570723508, "2": 0.00011856194397507701, "1": 3.832991814866843e-07}, "score": 4.1632851510472495}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7661356010799921, "5": 0.23365818019130447, "3": 0.00017942172815182386, "2": 2.6668659059986913e-05, "1": 0}, "score": 4.233425451103203}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7710579315842303, "5": 0.22792428238181325, "3": 0.0009170334580044266, "2": 9.972272232424377e-05, "1": 2.5108055827626743e-07}, "score": 4.2268072268688455}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8960149776676402, "5": 0.1037212569189026, "3": 0.0002340916154998733, "2": 2.9300001228878734e-05, "1": 0}, "score": 4.103428603962218}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9193955607889598, "5": 0.08033589875178257, "3": 0.00021531381271184158, "2": 5.276491905017406e-05, "1": 0}, "score": 4.080015092046138}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7825801294167446, "5": 0.21731466644562858, "3": 7.404896458463608e-05, "2": 3.086820093185374e-05, "1": 0}, "score": 4.217178943403479}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7310232163675191, "5": 0.2689284284563385, "3": 3.3711045994321913e-05, "2": 1.4498940212528495e-05, "1": 0}, "score": 4.268865758566521}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9300348410890159, "5": 0.06951010787054952, "3": 0.00038828032193094356, "2": 6.64268643313619e-05, "1": 0}, "score": 4.068988997542111}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7185919404451305, "4": 0.28140465279100535, "3": 2.515694875824454e-06, "2": 8.559220739960107e-07, "1": 0}, "score": 4.718587738162248}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6001353895325682, "4": 0.39977635529416905, "3": 7.406259084769734e-05, "2": 1.3915948520282652e-05, "1": 0}, "score": 4.600033661034328}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9329572025313695, "5": 0.06348853122661746, "3": 0.0018874642828755066, "2": 0.0016656813833766891, "1": 5.415821899655045e-07}, "score": 4.058268113167282}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9570458581741244, "5": 0.04075592708228695, "3": 0.0014388602094900264, "2": 0.0007582260483190031, "1": 5.822278331059166e-07}, "score": 4.037798888740603}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9448230043639757, "5": 0.02898048229176979, "3": 0.0181355260359234, "2": 0.008047590895346396, "1": 1.136601267411255e-05}, "score": 3.9947156656978176}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6855726531259513, "5": 0.3138780325193391, "3": 0.00044330568146374845, "2": 0.00010529432857093969, "1": 1.7660045011451253e-07}, "score": 4.3132237768136585}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8162978160125377, "2": 0.11759885264326808, "3": 0.06494425450860478, "5": 0.000626820087683852, "1": 0.0005036640900957315}, "score": 3.6989652606389645}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9410640423075364, "2": 0.0322014434434551, "3": 0.022131706840280537, "5": 0.0045671344762867536, "1": 3.17499629358836e-05}, "score": 3.9179369689295203}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7817814446844826, "5": 0.21709287969221833, "3": 0.0006097692201523285, "2": 0.0005134771644416406, "1": 1.1956686372252859e-06}, "score": 4.215452834913439}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7637173110511466, "5": 0.2329206130493255, "3": 0.0023930597540897983, "2": 0.0009668835439610944, "1": 8.413080112245499e-07}, "score": 4.228591557462064}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6583670476539776, "5": 0.3415563179834856, "3": 6.52853432109546e-05, "2": 1.065753930820484e-05, "1": 0}, "score": 4.341469953681308}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9861782172444278, "5": 0.012609643507796166, "3": 0.0010350625699853027, "2": 0.0001689693872469032, "1": 3.3989533906833236e-06}, "score": 4.0112264981612835}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9030244269907124, "5": 0.062419303530233394, "3": 0.022256288079100586, "2": 0.012291092081435492, "1": 7.824458697258763e-06}, "score": 4.015557374478592}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.978503511007166, "3": 0.01021159948915896, "5": 0.005818394001953843, "2": 0.005465875330031016, "1": 3.33922802808525e-07}, "score": 3.9846740376972845}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9351626608506936, "5": 0.06363862383249827, "3": 0.0010612745367431114, "2": 0.00013705064896281783, "1": 9.001531629857739e-08}, "score": 4.0623029966499935}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8702424221488778, "5": 0.12934998322978636, "3": 0.00036331759095305726, "2": 4.407538916987908e-05, "1": 7.053844193945736e-08}, "score": 4.128898320144095}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9147134977053257, "3": 0.045540897982354916, "2": 0.036593139554892774, "5": 0.003147902251165769, "1": 3.252716710104833e-06}, "score": 3.884410815611389}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt4", "target_model": "human", "scores": {"5": 0.5077936422373303, "4": 0.49217047431221106, "3": 3.200702973729629e-05, "2": 3.5910892113168184e-06, "1": 0}, "score": 4.507754597907557}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7370521717128062, "5": 0.26280404514641004, "3": 0.0001344293198528819, "2": 9.148030021989871e-06, "1": 0}, "score": 4.2626513738177785}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9545048305614148, "5": 0.04193801014134703, "3": 0.002898860065871956, "2": 0.0006570090926010573, "1": 5.287172748700525e-07}, "score": 4.03772357446199}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7185875498617876, "4": 0.28140293622785884, "3": 8.510430747776357e-06, "2": 6.562539526322827e-07, "1": 0}, "score": 4.718577976431842}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.965613902035251, "5": 0.032529227047486696, "3": 0.001723985874878722, "2": 0.00011731874630817, "1": 0}, "score": 4.030571079558467}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt4", "target_model": "human", "scores": {"2": 0.9306675543071601, "3": 0.05589092810030849, "4": 0.012667343185101135, "1": 0.000760733088097141, "5": 4.891052707690896e-06}, "score": 2.0804802426680697}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9680040024032565, "5": 0.03111643944309489, "3": 0.0005788923625528167, "2": 0.00030032540134163456, "1": 1.9419675321466134e-07}, "score": 4.029936318064078}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8474976352473823, "5": 0.1519479425530873, "3": 0.00046147055909497644, "2": 9.229994613885542e-05, "1": 0}, "score": 4.151301970704346}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5234091014221118, "4": 0.476569410085446, "3": 1.607867014594641e-05, "2": 5.139051646974064e-06, "1": 0}, "score": 4.523382886365396}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.5621560492086041, "4": 0.43780757133198805, "3": 3.226266108446887e-05, "2": 3.79348665512885e-06, "1": 0}, "score": 4.562116381312994}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8823649791591808, "5": 0.115741097548694, "3": 0.001049412599918861, "2": 0.0008432267131485316, "1": 4.520265137932132e-07}, "score": 4.1130039694568765}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.914890777210989, "4": 0.08509809747484609, "3": 7.564267824560652e-06, "2": 3.304583876002109e-06, "1": 0}, "score": 4.914876838406982}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.6790893972010217, "4": 0.3207791175588203, "3": 0.000118185752202469, "2": 1.2652850907506585e-05, "1": 0}, "score": 4.678946344778865}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5698181808521099, "4": 0.43012132884050686, "3": 3.764019735633805e-05, "2": 2.1784474952859475e-05, "1": 0}, "score": 4.569737578837196}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8076595162910205, "5": 0.1918359498596847, "3": 0.0004067285696657074, "2": 9.660655131978657e-05, "1": 0}, "score": 4.191236237427671}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9407359448377022, "3": 0.028855118040829675, "2": 0.025464552294745067, "5": 0.0049365281426361094, "1": 5.690474052656482e-06}, "score": 3.9251350719170004}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9558598472242188, "5": 0.04070542105291463, "3": 0.002260839668421704, "2": 0.0011729081686163852, "1": 0}, "score": 4.036098800564358}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.890762055934068, "5": 0.09388564310857192, "2": 0.008332822872151925, "3": 0.007016940374783329, "1": 1.6178248437141005e-06}, "score": 4.070198268089328}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.531188340723494, "4": 0.4687720653775342, "3": 3.194838264058438e-05, "2": 7.588406013566717e-06, "1": 0}, "score": 4.531141245862472}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.880478226425114, "5": 0.11915977968969521, "3": 0.00030954254860178596, "2": 5.213547180942873e-05, "1": 0}, "score": 4.118746003705156}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt4", "target_model": "human", "scores": {"5": 0.7879259465497738, "4": 0.21206740642757566, "3": 5.659918868721854e-06, "2": 8.545199394695462e-07, "1": 0}, "score": 4.787918682056313}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9613059100044025, "5": 0.03845707479832358, "3": 0.000211488909120393, "2": 2.448161818931808e-05, "1": 0}, "score": 4.03819666255573}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.562165662159236, "5": 0.4378150579054678, "3": 1.5003785830601036e-05, "2": 3.793551144950148e-06, "1": 0}, "score": 4.437792678295358}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.7122115292855296, "4": 0.2877594761606674, "3": 2.518202781063251e-05, "2": 3.5715710105238927e-06, "1": 0}, "score": 4.712179375718866}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.7057592184598108, "5": 0.29420419850367213, "3": 2.272077167771388e-05, "2": 1.2945905466594167e-05, "1": 0}, "score": 4.2941558554735355}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5621554589450624, "2": 0.3863634199467599, "3": 0.049120599029089065, "5": 0.0021921948991569422, "1": 0.00016642313612990633}, "score": 3.1798439249550676}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8335593946516499, "5": 0.16413758006580184, "3": 0.0017951350914734293, "2": 0.000506341102590143, "1": 1.1790506231130387e-06}, "score": 4.161326285314112}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9524444346579719, "2": 0.027876436971038726, "3": 0.011803623716922272, "5": 0.007862908522175926, "1": 1.110518990398532e-05}, "score": 3.9402730062439812}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6653602870508075, "4": 0.3345641630569558, "3": 5.732337940046194e-05, "2": 1.7482642961427385e-05, "1": 0}, "score": 4.665268493258676}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6512903370134995, "4": 0.3486106136009906, "3": 8.827531921620282e-05, "2": 1.0379529591410876e-05, "1": 0}, "score": 4.651181559550126}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8258739004572571, "5": 0.17311258773573981, "2": 0.0005340274584541155, "3": 0.0004786991199423626, "1": 2.3365083361795168e-07}, "score": 4.171565227377955}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6992311742757971, "4": 0.30073557160241043, "3": 2.673200556868922e-05, "2": 6.058647303766297e-06, "1": 0}, "score": 4.6991926490296825}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.977665981980343, "5": 0.010692504468003315, "2": 0.0060924053992269436, "3": 0.005547198241723796, "1": 6.431023176115536e-07}, "score": 3.992958557200714}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6925746838644616, "4": 0.307328183727926, "3": 5.6935642896666346e-05, "2": 3.97474845749342e-05, "1": 0}, "score": 4.692438564351311}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9439117852797771, "5": 0.05494225249360052, "3": 0.0006916208895091674, "2": 0.00045357605306995, "1": 0}, "score": 4.0533435203208965}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5033626472336902, "4": 0.3920192238344932, "3": 0.1038747637684214, "1": 0.000368822780108255, "5": 0.000368822780108255}, "score": 2.8886559397569616}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9701024213870756, "3": 0.015197816693993046, "5": 0.011652570261493573, "2": 0.003039754571142238, "1": 5.098296977398443e-06}, "score": 3.9903599269881846}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9289828881339487, "5": 0.06835503866147462, "3": 0.002413228020787531, "2": 0.00024652676259740445, "1": 8.352456197178834e-07}, "score": 4.065446348447058}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7057208756030651, "5": 0.29418822364941455, "3": 8.31045586671829e-05, "2": 7.149014806878008e-06, "1": 0}, "score": 4.294091011389202}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9714612040821095, "5": 0.027558231609715777, "3": 0.0008721239497047454, "2": 0.00010580063887946883, "1": 6.593053870483526e-07}, "score": 4.026472580892766}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8173104324597835, "5": 0.18236660586206785, "3": 0.00022030755733518483, "2": 0.00010245252883318077, "1": 0}, "score": 4.181941429924999}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8174870232802658, "5": 0.18240601954408964, "3": 8.234070332020164e-05, "2": 2.43398654100272e-05, "1": 0}, "score": 4.182275049528488}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.6363666169343802, "5": 0.36259074680588693, "3": 0.0008312286920057932, "2": 0.00021016744244105903, "1": 4.818027687996412e-07}, "score": 4.361338011831444}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5234103419031523, "4": 0.47657053955628637, "3": 1.607871838202919e-05, "2": 2.6247786218772366e-06, "1": 0}, "score": 4.523389230856854}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8352557780667232, "5": 0.1644716276408307, "3": 0.00023966534584605683, "2": 3.243517746207684e-05, "1": 0}, "score": 4.164167173000744}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9602802846078687, "2": 0.019929982955022945, "3": 0.014581087014534954, "5": 0.005199046685048926, "1": 7.0066209916418125e-06}, "score": 3.950736846201658}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7248440867595993, "5": 0.2751197834416129, "3": 2.6858640028536357e-05, "2": 8.584536968620597e-06, "1": 0}, "score": 4.275075944600784}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9489852719875135, "5": 0.05029437686871873, "3": 0.0003961918477537421, "2": 0.0003233623619299723, "1": 0}, "score": 4.049251499547304}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9495271976109604, "5": 0.050323093093866386, "3": 0.00011902630962543625, "2": 3.0094564015825906e-05, "1": 0}, "score": 4.050143907161964}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9860664683814763, "3": 0.007890021651170859, "2": 0.004937449384736736, "5": 0.0011016938719410744, "1": 2.4864464383622533e-06}, "score": 3.9833292827666282}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8968363276144112, "2": 0.08606676041377617, "3": 0.016684802563872423, "5": 0.00028262715569257665, "1": 0.00011598995099081247}, "score": 3.811113785401585}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9786104839223513, "5": 0.020955131966730458, "3": 0.00037785625970294804, "2": 5.6163302206616696e-05, "1": 0}, "score": 4.020464956563094}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9461563734128313, "2": 0.029478402571047717, "3": 0.022957803006026074, "5": 0.001400434966861363, "1": 3.2104578454881183e-06}, "score": 3.9194758914195558}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8354244666504591, "5": 0.16450483781490563, "3": 6.451808408815974e-05, "2": 5.726305497626372e-06, "1": 0}, "score": 4.164428941301124}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8632851114326983, "5": 0.13659153541235824, "3": 0.00010653787523807906, "2": 1.633811232486474e-05, "1": 0}, "score": 4.136452386423098}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9631321415095101, "5": 0.035082080708358, "2": 0.0009204114128494976, "3": 0.0008646465043934252, "1": 3.286774375823924e-07}, "score": 4.032375638010897}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7055457938609496, "5": 0.294115244604552, "3": 0.00025994681644682046, "2": 7.805018817899799e-05, "1": 3.9081423193589696e-07}, "score": 4.293698193468298}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5389472927286372, "4": 0.46098604850042546, "3": 5.428503323765483e-05, "2": 1.1924839266272432e-05, "1": 0}, "score": 4.538869399914496}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8354761308969189, "4": 0.1645150045280308, "3": 6.388551484586146e-06, "2": 2.2425924893649413e-06, "1": 0}, "score": 4.835465452184056}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7310532181759518, "4": 0.2689394547479427, "3": 4.154186238422745e-06, "2": 2.945759144661929e-06, "1": 0}, "score": 4.731043338513826}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9492955241506505, "2": 0.02339670683662337, "5": 0.013970807569155166, "3": 0.01333103771146065, "1": 3.7074731686760963e-06}, "score": 3.9538351314516396}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7981794357334475, "4": 0.20181135581993748, "3": 6.7032236867866626e-06, "2": 2.176218109170224e-06, "1": 0}, "score": 4.798168642674873}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9805377307049349, "5": 0.00889043499350863, "3": 0.006304262418454762, "2": 0.004265677327411888, "1": 6.449913055557625e-07}, "score": 3.9940528755149987}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5621726161914876, "5": 0.43782047371123084, "3": 5.266882112497055e-06, "2": 1.5568873786533032e-06, "1": 0}, "score": 4.437812130849714}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9887674673131828, "5": 0.006558972627189182, "3": 0.0026089790571911234, "2": 0.0020638723070829966, "1": 2.111555017045325e-07}, "score": 3.999821615400573}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8155121811501056, "4": 0.16058385689298438, "3": 0.01948103209269602, "1": 0.003230271789278909, "5": 0.0011883505806718}, "score": 2.3409849946223096}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8021047088295078, "2": 0.1052132327491625, "3": 0.0679307686852116, "5": 0.024602894016894982, "1": 0.00014629418468153842}, "score": 3.7458062430823533}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7227341705647745, "4": 0.27431894958340325, "3": 0.002647634444757422, "2": 0.0002970562628194474, "1": 1.214001050507393e-06}, "score": 4.7194894831965}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9046055650605894, "5": 0.08414143046113426, "3": 0.009008097355249987, "2": 0.002242292721920364, "1": 1.5194973022662366e-06}, "score": 4.070644266518813}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5067909438361302, "2": 0.42014444927027983, "3": 0.06858669592581297, "5": 0.004316624706732557, "1": 0.0001572329648326319}, "score": 3.0949656629736126}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8594128718812786, "5": 0.1402952988886463, "3": 0.0002076555210482379, "2": 8.390041484383e-05, "1": 0}, "score": 4.1399198807771995}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.8961244773882078, "4": 0.08872833438804223, "3": 0.011638624660200715, "1": 0.0034945488361432992, "5": 6.142363223717823e-06}, "score": 2.1856206329630354}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.813571536089918, "5": 0.18153233261736024, "3": 0.0037091735128390764, "2": 0.0011855230611142213, "1": 6.06417587442746e-07}, "score": 4.1754504390553375}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6858820190083708, "5": 0.3140196548403215, "3": 8.597757943020348e-05, "2": 1.1635800064184953e-05, "1": 0}, "score": 4.313910629407411}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9198207912804142, "2": 0.06458155727842242, "3": 0.015339470519018125, "1": 0.00016260266029606386, "5": 8.703493223105924e-05}, "score": 3.8550954039077525}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.973464819484576, "5": 0.017281069934798096, "2": 0.004951109431196067, "3": 0.004301598419028105, "1": 5.73995660936209e-07}, "score": 4.003075533215196}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9412600082402448, "5": 0.05832141085261585, "3": 0.0003749713255940501, "2": 4.273317531198997e-05, "1": 0}, "score": 4.057861023886159}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9773896319385726, "3": 0.009886154856479434, "5": 0.00734676645980321, "2": 0.005375009164213018, "1": 1.5665731988572521e-06}, "score": 3.986705881976021}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5544605610329264, "5": 0.4455215770102576, "3": 1.4568702420905339e-05, "2": 3.0064216710727746e-06, "1": 0}, "score": 4.445501123248795}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9552682766436505, "5": 0.044678494522985036, "3": 4.405207945497139e-05, "2": 9.090660410442755e-06, "1": 0}, "score": 4.04461626496388}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9597516048004971, "2": 0.02478960913754097, "3": 0.008434237198265047, "5": 0.006992228227002003, "1": 3.138423064365313e-05}, "score": 3.948884572196928}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8461231268110897, "5": 0.1042628254469775, "2": 0.03280775364212213, "3": 0.01675656093152476, "1": 4.8559777169016066e-05}, "score": 4.021745103415212}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8215015785177215, "5": 0.17219608886383786, "2": 0.003463861055795334, "3": 0.0028271209989545994, "1": 9.139809638616069e-06}, "score": 4.162414185382196}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6221413383389881, "4": 0.3773477888302913, "3": 0.0004282351916965207, "2": 8.046300857172118e-05, "1": 9.222375501421459e-07}, "score": 4.6215501888425425}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9238944365731444, "5": 0.07124309334789952, "2": 0.002805895891760402, "3": 0.002052837287609085, "1": 3.1842843119960448e-06}, "score": 4.063568946553004}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt4", "target_model": "human", "scores": {"4": 0.951013603616642, "5": 0.047348175135390816, "3": 0.001281656752619411, "2": 0.00035590322640761295, "1": 0}, "score": 4.0453547419216385}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.997087392794555, "3": 0.0017254075422951111, "5": 0.0006756793018733526, "2": 0.0005021222208888349, "1": 0}, "score": 3.9979460080140954}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9116914997055567, "5": 0.08219147440498235, "3": 0.005013713103347919, "2": 0.001101366607309289, "1": 9.288403168904655e-07}, "score": 4.074972317838289}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9193741979619036, "5": 0.08033402694714827, "3": 0.000251721560494028, "2": 3.982813443718895e-05, "1": 0}, "score": 4.080002667150063}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9239593701558861, "5": 0.07584319452660043, "3": 0.00014414194712372588, "2": 5.3026858957239866e-05, "1": 0}, "score": 4.0755930190079654}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.817514908238205, "5": 0.1824122396954091, "3": 6.616479725349885e-05, "2": 6.251200704170245e-06, "1": 0}, "score": 4.182333652006696}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7659112558001084, "5": 0.2335897283731895, "3": 0.00039177847214286876, "2": 0.0001054457452879515, "1": 0}, "score": 4.232987475832994}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.776278446772589, "5": 0.22240749869952448, "3": 0.0010793794352293457, "2": 0.00023343217363262377, "1": 5.435636640927542e-07}, "score": 4.220859778685508}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5544547392276001, "5": 0.44551689905825825, "3": 2.5971260414146508e-05, "2": 1.6602871311188165e-06, "1": 0}, "score": 4.4454879325039895}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6989628888022662, "5": 0.3006202014987564, "3": 0.0003575331045419483, "2": 5.7460775968818005e-05, "1": 0}, "score": 4.3001483218719745}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7474451457664772, "2": 0.1566730232238469, "3": 0.09210331894969268, "5": 0.0037426202921349958, "1": 3.4468317127283095e-05}, "score": 3.598189277985605}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9296071476145007, "5": 0.06526865978144603, "3": 0.004511532873298591, "2": 0.0006105695792391539, "1": 1.107264498584874e-06}, "score": 4.059532724470115}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9215030832264448, "3": 0.045878934987119244, "2": 0.030561959407550184, "5": 0.0020475240423715136, "1": 7.5008140748430615e-06}, "score": 3.8950220630800803}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9280388340823527, "5": 0.0715626635372148, "3": 0.00038144007381907735, "2": 1.6759320612147545e-05, "1": 0}, "score": 4.0711477263789355}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9589057522881502, "5": 0.036036880737555566, "3": 0.004581574328838526, "2": 0.000475407798068307, "1": 1.429582796433265e-07}, "score": 4.030504069316344}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8514626871333558, "5": 0.14340971579622572, "3": 0.0038819235029752238, "2": 0.0012407372743088202, "1": 3.7097354172246474e-06}, "score": 4.137035356620156}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9778958670746688, "5": 0.010695020710328936, "2": 0.006798168780855645, "3": 0.004599871089046947, "1": 9.752596506981008e-06}, "score": 3.9924695443317426}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9430178231972366, "5": 0.05489022485297295, "2": 0.0011753726884710493, "3": 0.0009153811701819956, "1": 3.5344250846963796e-07}, "score": 4.051623081581689}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6224426396683377, "4": 0.3775305448713099, "3": 2.035408355730105e-05, "2": 5.831542574859873e-06, "1": 0}, "score": 4.622411014515387}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9828126972045687, "5": 0.013377086478152557, "2": 0.0023983794472773336, "3": 0.0014099345416942802, "1": 8.975589825721653e-07}, "score": 4.007167707566849}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7769119931178833, "5": 0.22258901276648455, "3": 0.0003733280627786816, "2": 0.00012504923727743884, "1": 0}, "score": 4.221965723141067}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6653918924150639, "4": 0.3345800217741333, "3": 2.2802759468663275e-05, "2": 5.0091015013446555e-06, "1": 0}, "score": 4.665359253727648}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7031833783846212, "5": 0.2931304345238568, "3": 0.0030116637863282798, "2": 0.0006719930229566556, "1": 1.4699781812071614e-06}, "score": 4.288770680941796}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6001662792960086, "4": 0.3997969323127211, "3": 2.5596651904815557e-05, "2": 1.0838304344204076e-05, "1": 0}, "score": 4.600119218138564}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8517511860124996, "5": 0.14801216687235058, "3": 0.0001816216283582043, "2": 5.4532701975343893e-05, "1": 0}, "score": 4.147721552634979}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9666336900489827, "5": 0.03307639146081893, "3": 0.00016822873276741486, "2": 0.00012117061066451325, "1": 0}, "score": 4.032665838465086}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7772620397293823, "4": 0.22268931170737596, "3": 4.323531153315797e-05, "2": 5.004850578941919e-06, "1": 0}, "score": 4.777209112129771}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7309173426324215, "5": 0.2688894635501308, "3": 0.00016080308758572353, "2": 3.166400535451156e-05, "1": 1.3561375886926535e-07}, "score": 4.26866508442138}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9196390710412066, "4": 0.08035716647884165, "3": 3.2195337726296694e-06, "2": 3.612216782142803e-07, "1": 0}, "score": 4.919635296184343}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.6297712504847292, "4": 0.37022340805760673, "3": 3.8094566139785977e-06, "2": 1.0914275933356458e-06, "1": 0}, "score": 4.6297655356309075}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9782359386295326, "5": 0.019677992493603278, "3": 0.0016152676637049513, "2": 0.0004700696888983039, "1": 2.442364557417893e-07}, "score": 4.017121861086009}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9738084771933158, "2": 0.013049038840432755, "3": 0.0068763602531265195, "5": 0.00626099725905353, "1": 1.1599124846027964e-06}, "score": 3.9732829736134114}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9810230159198472, "5": 0.008894836848199571, "3": 0.005742938303856569, "2": 0.004334997263530518, "1": 1.7817598541104242e-06}, "score": 3.9944765453162514}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9044112856966492, "5": 0.09532425391688062, "3": 0.0002085208545301333, "2": 5.355258444268966e-05, "1": 0}, "score": 4.095008854674613}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.699179062518347, "5": 0.3007131676368841, "3": 9.476617653240566e-05, "2": 1.2237898338425246e-05, "1": 0}, "score": 4.300594155849631}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9117332278687276, "5": 0.08749636756702436, "3": 0.0006178389704960835, "2": 0.0001514079058542921, "1": 0}, "score": 4.08657581301259}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.5077865280982372, "5": 0.4921635790521674, "3": 3.460736629018559e-05, "2": 1.4202834508535356e-05, "1": 0}, "score": 4.492101098789522}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7422858035433204, "5": 0.2565270915168433, "3": 0.0009695815221687572, "2": 0.00021634288031847316, "1": 0}, "score": 4.255125125418777}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6076346270537499, "4": 0.3923184094101835, "3": 3.4872709409294506e-05, "2": 1.1321511153198199e-05, "1": 0}, "score": 4.607577578740885}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5311788697198132, "5": 0.4687637072461215, "3": 4.43551825651886e-05, "2": 1.2316989358177273e-05, "1": 0}, "score": 4.468695070010225}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7541648884012047, "5": 0.2448414795724113, "3": 0.0007915488201516637, "2": 0.0002001346836120869, "1": 0}, "score": 4.243650136142837}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.6852488856468366, "5": 0.3137297915540498, "3": 0.0007899048996020978, "2": 0.00022987520114985948, "1": 0}, "score": 4.312480618315487}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8598931772066571, "5": 0.13605485894284458, "3": 0.003301273420315692, "2": 0.0007482136443371896, "1": 7.976682920785934e-07}, "score": 4.131254985621529}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.615044067051715, "4": 0.38488475390967963, "3": 5.216697114624377e-05, "2": 1.8312329166908564e-05, "1": 0}, "score": 4.6149557057302895}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9837947008945106, "3": 0.007167395070049952, "2": 0.006227140751043474, "5": 0.002806792238047111, "1": 0}, "score": 3.98318504889296}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8950970328426217, "5": 0.10361499709802222, "3": 0.001169185414002005, "2": 0.00011758806685145361, "1": 3.9839454643373607e-07}, "score": 4.102209521948678}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.974660239521994, "5": 0.013687243654762149, "3": 0.010013801375024741, "2": 0.0016347081370780673, "1": 2.7849211426857456e-06}, "score": 4.000395671725819}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8894773552871691, "2": 0.07772166745952076, "3": 0.029042465281937938, "5": 0.003692335848239473, "1": 6.353008403028648e-05}, "score": 3.819015466503016}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8354009247206963, "5": 0.16450019884388906, "3": 8.957189133325833e-05, "2": 8.595953402792054e-06, "1": 0}, "score": 4.164393551533489}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8123691450456977, "5": 0.18701800188428788, "3": 0.0005505045151102634, "2": 5.986455285774055e-05, "1": 5.513334711837115e-07}, "score": 4.186346474409023}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8646808237743574, "5": 0.13260310303945505, "3": 0.001749334236004364, "2": 0.0009660741179874653, "1": 2.604070117841652e-07}, "score": 4.128920891485295}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt4", "target_model": "claude", "scores": {"2": 0.9541449336574893, "4": 0.0231516413572992, "3": 0.022439340236171404, "1": 0.00017402440673404475, "5": 8.888296976442572e-05}, "score": 2.068835328498155}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.5388679116389791, "4": 0.46091815025630983, "3": 0.00014525278334090222, "2": 6.754881745019851e-05, "1": 0}, "score": 4.538588173328308}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.8267042713413577, "4": 0.17328663601106487, "3": 6.4210172670705435e-06, "2": 2.28948421360681e-06, "1": 0}, "score": 4.826693587273391}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.5467037575263959, "5": 0.4532333340080194, "3": 4.7100685636954e-05, "2": 1.5532157589944732e-05, "1": 0}, "score": 4.453155293906933}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9911986734454207, "3": 0.004245205714368256, "5": 0.003154769008786516, "2": 0.0013999202615761713, "1": 0}, "score": 3.9961097172020543}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9861187485463332, "5": 0.009667568006101872, "3": 0.003393635545274678, "2": 0.0008187526781477575, "1": 4.0592233043215e-07}, "score": 4.004635213459643}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9634137688050386, "5": 0.035092347227091716, "3": 0.001163849189909712, "2": 0.00032827890197179954, "1": 0}, "score": 4.033271998654741}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9658575059680866, "5": 0.034098939325516296, "3": 3.809741979655673e-05, "2": 5.237119104701052e-06, "1": 0}, "score": 4.034050375164297}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9880186469314214, "2": 0.004795014723773701, "3": 0.003676465317268473, "5": 0.0035081077129421037, "1": 9.456167280905141e-07}, "score": 3.9902387680966807}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9676556223877483, "5": 0.028321642895287272, "3": 0.002938799836068308, "2": 0.0010811240414075355, "1": 1.4344142216523342e-06}, "score": 4.023216323689273}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9835068158291157, "5": 0.014474300230611683, "2": 0.0010485147919463203, "3": 0.0009697176609711903, "1": 4.3095765496948834e-07}, "score": 4.011406262628203}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.707433639233693, "5": 0.28582904260993997, "3": 0.004477854291857988, "2": 0.0022516065394989023, "1": 6.6278108289745506e-06}, "score": 4.27682843217108}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.6224313735585183, "4": 0.3775237116302887, "3": 3.802574985350782e-05, "2": 6.5054387510245725e-06, "1": 0}, "score": 4.62238057569041}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9652474602740193, "5": 0.030073202083668784, "2": 0.002430286809484652, "3": 0.002247647871526877, "1": 1.030598352125805e-06}, "score": 4.022961897348276}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt4", "target_model": "human", "scores": {"2": 0.45575533933547463, "4": 0.42814251921873325, "3": 0.11523301306838717, "5": 0.0004564419633342322, "1": 0.0004091519315979795}, "score": 2.97248166268365}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8688084185411694, "5": 0.1213128418655251, "3": 0.005853985310649071, "2": 0.0040233813422089456, "1": 8.186305121548407e-07}, "score": 4.107409697517185}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9287028327252221, "5": 0.04276259530396688, "2": 0.015487585677503229, "3": 0.01304185471307436, "1": 3.801115430357856e-06}, "score": 3.998734164205445}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7484149566107706, "5": 0.25068760916236327, "3": 0.0008361746961696219, "2": 6.05722918287165e-05, "1": 2.184577947734358e-07}, "score": 4.249729751577734}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9250757850888435, "5": 0.06913945687207913, "3": 0.004024400191345652, "2": 0.001758130236970169, "1": 1.5060729352174376e-06}, "score": 4.061594322430621}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8897450081533383, "5": 0.10963810407190626, "3": 0.0005664083349685374, "2": 4.9492223586185075e-05, "1": 0}, "score": 4.108972818869498}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9815872300417284, "5": 0.016369518526077854, "3": 0.0013228598935818455, "2": 0.0007192264489274206, "1": 4.578569673362459e-07}, "score": 4.0136068417869435}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8591555849995212, "5": 0.14025328673826276, "3": 0.0005137979824595879, "2": 7.63692828175838e-05, "1": 0}, "score": 4.139586884332736}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.665346913443443, "5": 0.33455743838486157, "3": 8.605086354247675e-05, "2": 9.06969429025585e-06, "1": 0}, "score": 4.334453424595002}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9017123195390156, "5": 0.09805666040382147, "3": 0.00018062563202560553, "2": 5.0157926510700356e-05, "1": 0}, "score": 4.097775742042603}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9576753007131408, "3": 0.029837284792352727, "2": 0.010976525850788848, "5": 0.0015089046330010731, "1": 1.5111781191295789e-06}, "score": 3.9497140108278583}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9787787929749945, "5": 0.01396152984362469, "3": 0.006292954529698456, "2": 0.0009650558332585491, "1": 1.012892964677965e-06}, "score": 4.005735428719057}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9652273592049622, "5": 0.031027182620103195, "3": 0.00312048450235663, "2": 0.0006241361651615548, "1": 4.944761092465972e-07}, "score": 4.026656951503265}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9296510251777413, "5": 0.0694814130714587, "3": 0.0007963705224161475, "2": 7.068190206063578e-05, "1": 1.3225010133104714e-07}, "score": 4.068543307840669}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9804549895586415, "5": 0.016350632457027753, "3": 0.002392626170946176, "2": 0.0008014293796719733, "1": 1.7358247331222833e-07}, "score": 4.01235462861832}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8516202733992442, "5": 0.1479894191505095, "3": 0.00031376539531156227, "2": 7.569942449451758e-05, "1": 0}, "score": 4.147524379214742}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9853705831670335, "5": 0.00966023213990872, "3": 0.0033910604140469742, "2": 0.001576989546103598, "1": 0}, "score": 4.00311519616857}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7245781612627384, "5": 0.27501886050851243, "3": 0.0003427821307270503, "2": 5.956660260078547e-05, "1": 0}, "score": 4.274557118005033}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.5155992822425588, "4": 0.4843607009159119, "3": 3.249904024460042e-05, "2": 6.812168906750047e-06, "1": 0}, "score": 4.515553522655758}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9657539793190203, "5": 0.034095290934200884, "3": 0.00012490326503268465, "2": 2.5375637443290386e-05, "1": 0}, "score": 4.033919651686764}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9570058066430439, "5": 0.035407883000598585, "2": 0.0038504278769020957, "3": 0.003731962665247701, "1": 2.6920811547446327e-06}, "score": 4.023967017763182}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8028141711988062, "5": 0.19673807567531013, "2": 0.00023035660344189232, "3": 0.00021640000237865733, "1": 3.924400697174511e-07}, "score": 4.1960599035817046}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.801486420246464, "5": 0.1964126845229302, "3": 0.0018088982874368276, "2": 0.00029071649780924245, "1": 5.030697542600658e-07}, "score": 4.194020994857801}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.855844464243564, "4": 0.14414773036137507, "3": 4.159810656464127e-06, "2": 3.3425017647412366e-06, "1": 0}, "score": 4.855833878817768}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8869862397852922, "5": 0.11276765810017508, "3": 0.0002077239548162673, "2": 3.782934249456442e-05, "1": 0}, "score": 4.112484337193711}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9269153719300789, "3": 0.04072581957826606, "2": 0.031717300178778364, "5": 0.0006380186774806178, "1": 2.1956816784335176e-06}, "score": 3.8964708777347297}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9982987732295737, "5": 0.0012442740643084198, "3": 0.00037948214916814447, "2": 7.590128071421324e-05, "1": 6.464939479701811e-07}, "score": 4.000711050528013}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8298749933135425, "5": 0.16859933123499113, "3": 0.0011720745273031037, "2": 0.00035192059155120416, "1": 5.90243602303583e-07}, "score": 4.16672182653541}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8633496185061788, "5": 0.1366017391811596, "3": 3.98132813133237e-05, "2": 8.476736745241078e-06, "1": 0}, "score": 4.13654502053043}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9955520283576313, "5": 0.002078034051020986, "3": 0.0020140996646230503, "2": 0.0003555097083828692, "1": 0}, "score": 3.9993529147572473}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9860427029868806, "5": 0.009666821698659641, "3": 0.0031877794555856226, "2": 0.0011016671011052535, "1": 0}, "score": 4.0042757124395365}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9564940392079735, "5": 0.04335944160704389, "3": 0.00011989969976247949, "2": 2.6338468680352955e-05, "1": 0}, "score": 4.043186877106148}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9620468941373317, "5": 0.03504255846590407, "3": 0.0016909885165690797, "2": 0.0012179733378996395, "1": 5.006082389169359e-07}, "score": 4.030914154988638}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8990961932109356, "5": 0.10087580220073515, "3": 2.4374086955934777e-05, "2": 3.2986739618152596e-06, "1": 0}, "score": 4.100844864228946}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9930625370745505, "5": 0.0060924072269488375, "3": 0.00048470892588742937, "2": 0.0003602050879410493, "1": 0}, "score": 4.004887288817633}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt4", "target_model": "human", "scores": {"4": 0.7239216070602124, "5": 0.2747696413976683, "3": 0.0008609733555072425, "2": 0.00044666709264725384, "1": 0}, "score": 4.273015637202892}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6511884245630079, "4": 0.34855602545326414, "3": 0.00020844590475595882, "2": 4.651056811048144e-05, "1": 1.6514268155801177e-07}, "score": 4.650886740913156}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9715273589566782, "2": 0.014984169527542801, "3": 0.010625367250670672, "5": 0.0028597787994246583, "1": 2.301358401551558e-06}, "score": 3.962259129767764}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9525731328820952, "4": 0.04742582819764468, "3": 7.558189300273071e-07, "2": 1.5355392940392514e-07, "1": 0}, "score": 4.952572193358558}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt4", "target_model": "llama", "scores": {"5": 0.7826514570200892, "4": 0.21733446471353923, "3": 1.1901834619783692e-05, "2": 1.942921091648852e-06, "1": 0}, "score": 4.7826358520971}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8696650860606928, "2": 0.11056551917827932, "3": 0.018915530022695307, "5": 0.000831090387058734, "1": 1.7796255285815464e-05}, "score": 3.760729942132632}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7971269165671684, "2": 0.15696360747904708, "3": 0.04358721960165867, "5": 0.0019150887744669605, "1": 0.00040142441453351553}, "score": 3.6431943317779574}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8584545682185613, "5": 0.14013885871005777, "3": 0.0009151965564188939, "2": 0.0004898694161644377, "1": 0}, "score": 4.138244131668874}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.6926102554136945, "5": 0.3073439193337609, "3": 3.734121057684829e-05, "2": 7.950402513108758e-06, "1": 0}, "score": 4.3072908413006745}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8030509640406066, "5": 0.1967961022894305, "3": 0.00011406843302255695, "2": 3.820813908479076e-05, "1": 0}, "score": 4.196605746767452}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8165140166260338, "2": 0.09161035205378584, "3": 0.09161035205378584, "5": 0.00024939788627371056, "1": 1.4070065943964852e-05}, "score": 3.725375634096076}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9036352089072001, "2": 0.07417488968741155, "3": 0.021926055510777614, "5": 0.00025526585175190107, "1": 7.018542377634627e-06}, "score": 3.8299581098185245}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9772116664681452, "2": 0.012301279470768263, "3": 0.007119434363803949, "5": 0.0033629826678959907, "1": 3.6417289602775268e-06}, "score": 3.9716300359390373}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9338783738033929, "5": 0.06556855778447339, "3": 0.0004282047880772514, "2": 0.00012461469763750866, "1": 0}, "score": 4.0648911397542395}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9511040768929884, "3": 0.025346064691242676, "2": 0.023077854521585093, "5": 0.00046422927528943245, "1": 5.843784150445426e-06}, "score": 3.9289447869925507}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9756067693610319, "5": 0.01731908857366646, "3": 0.005535513189256453, "2": 0.0015371564967389456, "1": 9.93958879358679e-07}, "score": 4.008706284679558}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9328556276809931, "5": 0.05871091053493444, "3": 0.0061880844437030786, "2": 0.0022411756657946783, "1": 3.215171043432873e-06}, "score": 4.048030876629141}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8629254640955436, "5": 0.1365346295767062, "3": 0.0004625864960551275, "2": 7.670436048757934e-05, "1": 1.1177230791213694e-07}, "score": 4.135918367504684}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8353387899107377, "5": 0.1644879604843677, "3": 0.00016473573072780636, "2": 8.074553374860379e-06, "1": 0}, "score": 4.164307147830437}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8079477325431188, "5": 0.1919044091390038, "3": 0.00012408943528975148, "2": 2.3315714095854032e-05, "1": 8.675879846801608e-08}, "score": 4.191733498252139}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt4", "target_model": "human", "scores": {"4": 0.8749618093799235, "2": 0.09222029991870162, "3": 0.032372369928245166, "5": 0.0004337900051772595, "1": 9.144801337288481e-06}, "score": 3.7835928262137903}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9704344880003056, "5": 0.01593263113737551, "2": 0.009663629274710414, "3": 0.003965945463451027, "1": 2.1594953453013593e-06}, "score": 3.9926329401911844}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9040968313509665, "5": 0.09529109637703144, "3": 0.00044128545573693373, "2": 0.00017013063071905305, "1": 1.0334488955346042e-07}, "score": 4.094509291873767}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5077618908935972, "5": 0.49213969985462575, "3": 8.432197928102738e-05, "2": 1.355177531044229e-05, "1": 0}, "score": 4.492028537804621}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9812903006527313, "5": 0.01797295771339532, "3": 0.00047153746494087953, "2": 0.00026450854525116957, "1": 0}, "score": 4.016972414964366}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt4", "target_model": "human", "scores": {"5": 0.8705089224739008, "4": 0.1293895833201376, "3": 8.906198232583937e-05, "2": 1.2053228603681666e-05, "1": 0}, "score": 4.87039608391016}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.6859073422399765, "4": 0.3140312737824997, "3": 5.817749278094496e-05, "2": 2.5963939965773593e-06, "1": 0}, "score": 4.685844390386519}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.8806611647787174, "4": 0.11918453174634884, "3": 0.00014624796302258581, "2": 6.947824284421439e-06, "1": 0}, "score": 4.8805019964882925}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9626727773451229, "4": 0.03732687135657103, "3": 2.329558235161355e-07, "2": 2.7822605477550148e-08, "1": 0}, "score": 4.962672575885092}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.6295236227440492, "5": 0.3700778463253395, "3": 0.00036488913144089443, "2": 3.238578389907967e-05, "1": 0}, "score": 4.3696486499104505}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9738161605725117, "5": 0.02595132528399814, "3": 0.0001920445848755967, "2": 4.0254731830630565e-05, "1": 0}, "score": 4.02567877675195}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.9933997007967933, "5": 0.004321631439434228, "3": 0.0018298938852724309, "2": 0.00044843478228695244, "1": 0}, "score": 4.001594868530401}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8957266058209755, "5": 0.1036878847882899, "3": 0.0005191877431693019, "2": 6.600731425715863e-05, "1": 0}, "score": 4.103036714804477}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.9720180555747858, "5": 0.02757402975877852, "3": 0.00035257189466915856, "2": 5.492010858048991e-05, "1": 0}, "score": 4.027111629106036}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9965788726376418, "5": 0.001807289626349493, "3": 0.0010624507618794841, "2": 0.0005511921941068441, "1": 0}, "score": 3.999642454406614}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt4", "target_model": "human", "scores": {"4": 0.5232868735001959, "5": 0.4764581202960916, "3": 0.00023255704690527702, "2": 2.197181636942361e-05, "1": 0}, "score": 4.476181846917299}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.8900514401543067, "5": 0.10967585897027102, "3": 0.00017552553975090507, "2": 9.543158067124637e-05, "1": 0}, "score": 4.109309660878445}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt4", "target_model": "gpt35", "scores": {"5": 0.7605781585345628, "4": 0.23932653602861098, "3": 8.680893533054079e-05, "2": 7.826062875714371e-06, "1": 0}, "score": 4.7604762073261}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.5925826393514689, "5": 0.40727569482392184, "3": 0.00010978188766604203, "2": 3.145303742468758e-05, "1": 0}, "score": 4.407103182281972}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.4999720160631026, "5": 0.4999720160631026, "3": 4.88098705592349e-05, "2": 6.402461705947177e-06, "1": 0}, "score": 4.499910778972486}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt4", "target_model": "human", "scores": {"4": 0.984907256579335, "5": 0.012016699158807376, "3": 0.0027235121499433745, "2": 0.0003517084474023878, "1": 0}, "score": 4.008589777189154}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.986701128902879, "5": 0.008807620203368524, "2": 0.0027284734554748205, "3": 0.0017616348659249366, "1": 4.748518387450096e-07}, "score": 4.0015876149310605}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.956558826656304, "5": 0.042028261253399896, "3": 0.0012110252065142702, "2": 0.0002008076647117379, "1": 0}, "score": 4.040415664334818}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7121819375112611, "5": 0.28774750561544815, "3": 6.330495207763029e-05, "2": 6.467007989982256e-06, "1": 0}, "score": 4.287671492444549}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.8513834451886455, "5": 0.14794825422040914, "3": 0.0005591920969072286, "2": 0.00010840433272171284, "1": 0}, "score": 4.147172357091139}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt4", "target_model": "human", "scores": {"2": 0.8278695047305169, "4": 0.11559647688287794, "3": 0.05633722343794037, "1": 0.0001486523796855704, "5": 4.533641433199289e-05}, "score": 2.2875183408879356}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7755836626340084, "2": 0.1600507382429333, "3": 0.06074840817411544, "5": 0.0033217470984289155, "1": 0.00028575121595151995}, "score": 3.621610941203723}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.8944607108747168, "5": 0.10354133231038959, "3": 0.001726715897015966, "2": 0.00026897045960161197, "1": 6.772102845028213e-07}, "score": 4.101274805219196}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.8555557938077749, "5": 0.1440991031210279, "3": 0.000273863979505056, "2": 7.033408682936384e-05, "1": 0}, "score": 4.143684701003218}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9802088978124424, "5": 0.008092120245396755, "2": 0.00630214958382296, "3": 0.005390514198515387, "1": 5.1514104860536964e-06}, "score": 3.990081841075772}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt4", "target_model": "human", "scores": {"4": 0.9746916153147708, "5": 0.013060873157235304, "3": 0.007799003576885639, "2": 0.004443738288124471, "1": 3.98934300907518e-06}, "score": 3.9963624221365985}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt4", "target_model": "claude", "scores": {"5": 0.7121042640633353, "4": 0.2877161140750252, "3": 0.0001448906844810507, "2": 3.388100585048353e-05, "1": 1.5937100308986876e-07}, "score": 4.711891625029096}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.9364471520784661, "2": 0.027839842523928543, "3": 0.01854533322030626, "5": 0.01715162427401125, "1": 1.4464878777098738e-05}, "score": 3.942883120952097}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt4", "target_model": "gpt4", "scores": {"5": 0.9046482815438998, "4": 0.09534923214341165, "3": 1.8045325045050578e-06, "2": 5.767632307347826e-07, "1": 0}, "score": 4.904645418488039}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt4", "target_model": "llama", "scores": {"4": 0.9291303238426699, "5": 0.06322810356546155, "2": 0.0044393096449443555, "3": 0.003197514786908996, "1": 3.8028643456755056e-06}, "score": 4.051140609238624}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt4", "target_model": "human", "scores": {"2": 0.5885166502433782, "4": 0.34597111156389915, "3": 0.061067528653800884, "5": 0.003287427286163925, "1": 0.0011539955119829759}, "score": 2.7617205417060706}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt4", "target_model": "claude", "scores": {"4": 0.7013804812046208, "2": 0.2423906253096486, "3": 0.052420638536463095, "5": 0.0030039415579895612, "1": 0.0007959652729649723}, "score": 3.4634096770638325}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt4", "target_model": "gpt35", "scores": {"4": 0.7026264949486262, "2": 0.20130586724301944, "3": 0.05503396163730642, "5": 0.040897767572603314, "1": 0.0001301686032164743}, "score": 3.5828591712532423}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt4", "target_model": "gpt4", "scores": {"4": 0.7750903544789558, "5": 0.21523483308826175, "3": 0.0060110820803152476, "2": 0.003645905579760396, "1": 1.5615040087335922e-05}, "score": 4.201885540841229}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt4", "target_model": "llama", "scores": {"2": 0.5815928770504787, "4": 0.2580802747534662, "3": 0.1589986448109183, "1": 0.0006916990470855017, "5": 0.0006297991493280454}, "score": 2.676361427849768}]