[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5885313986554301, "3": 0.38647364583251925, "2": 0.024294230130962362, "5": 0.000645973549542882, "1": 5.466122316588711e-05}, "score": 3.5654198444089973}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6339568796679148, "2": 0.32023611368631516, "4": 0.04553780586036065, "1": 0.0001986575638825325, "5": 7.053962142386608e-05}, "score": 2.725045455299264}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6981758875984524, "5": 0.2922367551297457, "3": 0.009586667000257752, "2": 4.424457406574657e-07, "1": 0}, "score": 4.28264927328579}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6031270246270081, "5": 0.3918772993705177, "3": 0.004994592758675744, "2": 3.6646053579949867e-07, "1": 0}, "score": 4.386882251001493}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9902311393632952, "2": 0.007648750330330582, "4": 0.001677710017891881, "5": 0.0004423084803390008, "1": 1.2074716777117364e-07}, "score": 2.9949133353011064}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9308826750507071, "5": 0.05706736881597758, "3": 0.011946081049966934, "2": 0.00010302807850916974, "1": 0}, "score": 4.044915269652442}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8927121772223752, "2": 0.10310878325270427, "3": 0.002980096191377621, "4": 0.0010142011709993993, "5": 0.0001841798190747434}, "score": 1.1128483618842957}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5588369108527028, "2": 0.21520685437861584, "3": 0.16735666925209391, "5": 0.040787292680221694, "1": 0.017810833201220025}, "score": 3.389583536290241}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5489655444537308, "4": 0.4501143578263275, "3": 0.0006972336367501786, "1": 0.00011187918211885152, "2": 0.0001059236506778604}, "score": 4.547723598135546}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8131592330516538, "3": 0.13721617185133464, "5": 0.049598395230423364, "2": 1.4046799243333043e-05, "1": 0}, "score": 3.9123530646014943}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.431833319362697, "3": 0.3954661236227024, "4": 0.15576554794574024, "1": 0.014133435170194554, "5": 0.002800514860372869}, "score": 2.70126607159273}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9998010091513059, "3": 0.00012533135348869628, "4": 4.882900777914415e-05, "1": 2.432205514789828e-05, "5": 4.3269142817483367e-07}, "score": 2.0001999654033296}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9989169272471365, "4": 0.0010788392331079416, "3": 3.471152106317442e-06, "1": 0, "2": 0}, "score": 4.998914217634915}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7912389902472657, "5": 0.20871186804185182, "3": 3.4880521771154086e-05, "1": 0, "2": 0}, "score": 4.208679963544504}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9700753840392699, "4": 0.029914382325649195, "3": 2.8964433635795143e-06, "1": 0, "2": 0}, "score": 4.97007960525595}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9922070705566829, "3": 0.0071035934731004825, "4": 0.0005876100560753384, "1": 9.896750440945449e-05, "5": 1.956485121453088e-06}, "score": 2.008185722100538}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5290110282434632, "2": 0.46183425854678156, "4": 0.007752072903202549, "1": 0.0012445034051515812, "5": 0.00015798918131050405}, "score": 2.543744718510667}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8469952266010307, "3": 0.07065550171922182, "5": 0.059908414975286116, "2": 0.022426353861377542, "1": 1.3174624037462314e-05}, "score": 3.9443606077598963}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7237863694199829, "3": 0.2749400513969758, "4": 0.0011390629821962362, "5": 0.00011698392801446717, "1": 1.6967276172468824e-05}, "score": 2.277552318685372}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9563420261261814, "3": 0.028928587093132594, "2": 0.012416073447577699, "1": 0.0016427107587627344, "5": 0.0006701084453135664}, "score": 3.9419812135119705}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8736569990103725, "3": 0.07577859606662678, "5": 0.04441609389986703, "2": 0.006145273679593881, "1": 2.8558700934732118e-06}, "score": 3.956338374940347}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8650655799093152, "4": 0.1333145107343487, "3": 0.001514790096173989, "2": 9.909723679639151e-05, "1": 5.391386340960875e-06}, "score": 4.863336965632781}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5048312570504646, "4": 0.4898781952016598, "3": 0.005179788777948219, "2": 0.00010902678194483144, "1": 1.263547900342245e-06}, "score": 4.499429858117775}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7781059512110929, "4": 0.21836290465901412, "3": 0.00335425697850323, "2": 0.00015852567347558136, "1": 1.6424835645597167e-05}, "score": 4.774386868089043}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4536114882769933, "2": 0.31147817730951655, "4": 0.2273595940794, "5": 0.007014418939541686, "1": 0.0005356436232616762}, "score": 2.9288389191715067}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5188153185950247, "4": 0.34765902248183855, "2": 0.13183119507234883, "5": 0.0016847341535484324, "1": 9.628327723859831e-06}, "score": 3.219178061279112}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6143699548227991, "5": 0.36860351415567977, "3": 0.016408734409178744, "2": 0.0006166972100350531, "1": 8.673866469526402e-07}, "score": 4.350958864594443}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9775949893873953, "4": 0.022157941810590453, "3": 0.00018761285505358537, "2": 5.840290069083281e-05, "1": 0}, "score": 4.977291599864234}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9661941418136604, "4": 0.03277054124268387, "2": 0.0008274062915213631, "3": 0.0002034980775611913, "1": 0}, "score": 4.964340086375602}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7943729640500028, "5": 0.19341148752038598, "3": 0.012179495961840158, "2": 3.4539705901640014e-05, "1": 0}, "score": 4.181163186203503}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8270886706969179, "4": 0.1267288518172284, "2": 0.045958245556519985, "5": 0.00019140001511015406, "1": 3.2783998900678055e-05}, "score": 3.0810878421784773}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9977671911344479, "4": 0.0021744750497704906, "1": 5.280133940789715e-05, "3": 4.195858880110344e-06, "2": 1.1644973771087907e-06}, "score": 4.9976024339700365}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9893767980391839, "4": 0.010621032985082702, "3": 5.657627591827117e-07, "1": 0, "2": 0}, "score": 4.989377818459779}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9899516108275868, "4": 0.009885087209408913, "1": 0.00015291077142436574, "3": 8.57429314825782e-06, "2": 1.4310716339179223e-06}, "score": 4.989481823845502}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5570626877808987, "5": 0.43935352230076835, "3": 0.0035770361947918246, "2": 5.29906589057954e-06, "1": 9.598517418344959e-07}, "score": 4.435763224037188}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4701756832371761, "2": 0.4022715181788865, "4": 0.12580338843288028, "5": 0.001594165304161656, "1": 0.00015365034869182825}, "score": 2.7264124639300986}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9654378750799438, "3": 0.030906359722301036, "1": 0.003229672629435792, "4": 0.00042231697512225795, "5": 3.768309747041214e-06}, "score": 2.0285326261801666}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8317746485142098, "4": 0.16707930484057257, "3": 0.001135111948355888, "2": 5.054578963796492e-06, "1": 0}, "score": 4.830634311635608}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.774421654865276, "4": 0.07340075920667274, "5": 0.07058169116893798, "2": 0.06420655311840252, "3": 0.017377674001598484}, "score": 1.601497961478511}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4947864616971056, "4": 0.46057985453147987, "3": 0.024917642307305317, "5": 0.01970738185448702, "1": 5.177294165727607e-06}, "score": 3.005197820055466}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6549785054449013, "3": 0.23282103748595825, "2": 0.0600685301122965, "5": 0.052092671620061565, "1": 3.8245754397348834e-05}, "score": 3.69901953278174}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5835207305218467, "4": 0.3853601066137785, "3": 0.02982093545750255, "2": 0.0012648400594672661, "1": 3.1958623738268894e-05}, "score": 4.551075026408127}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7162730929549882, "4": 0.27450837732776456, "3": 0.008438638487787932, "2": 0.0007315814479182652, "1": 4.70857570859074e-05}, "score": 4.706230898743997}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9885501601068042, "5": 0.01144558285807678, "3": 3.0462080595400274e-06, "1": 0, "2": 0}, "score": 4.011442550504968}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9312951194927873, "5": 0.06852582482622414, "3": 0.0001740764478114116, "2": 2.5686194047352635e-06, "1": 0}, "score": 4.0683467758972816}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4919582469567593, "2": 0.4855316999370958, "4": 0.02068925077124465, "1": 0.001792849007713986, "5": 2.795118394132521e-05}, "score": 2.531627754182767}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9063670341683232, "4": 0.09286643508577047, "3": 0.0005369496121397031, "1": 0.00019558216216452635, "2": 3.324660171984577e-05}, "score": 4.905177525894559}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9393905735339498, "1": 0.031135071319709846, "4": 0.02882177215048093, "3": 0.00045243443515844995, "2": 0.00019360781833024324}, "score": 4.84515123741951}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8071940589836412, "1": 0.1538712600331794, "4": 0.0387241826276285, "3": 0.00015805681515271465, "2": 4.716506913745348e-05}, "score": 4.345329714052988}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7131409230936266, "5": 0.26019854624161226, "3": 0.018513371947958365, "1": 0.005965866320676926, "2": 0.0021804750785133263}, "score": 4.219426804515988}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.37971988607207086, "1": 0.37942884364633056, "3": 0.12672143839624175, "2": 0.10279611690213881, "5": 0.011326563044071177}, "score": 2.5407159231936447}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7497130842332743, "5": 0.2309057408507136, "3": 0.01925447072035195, "2": 0.00012296731126328165, "1": 0}, "score": 4.211406125508087}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.998776117755515, "4": 0.0012066126596624678, "3": 1.6237096924776192e-05, "1": 0, "2": 0}, "score": 4.998760911867144}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7314496441921163, "5": 0.24147621484368473, "3": 0.026271494156218652, "2": 0.0008006116179157802, "1": 0}, "score": 4.213603932176235}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5478901545653119, "4": 0.4503504596960713, "3": 0.0016741947090982525, "2": 7.946610336452301e-05, "1": 0}, "score": 4.546060153803541}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8045282485421692, "1": 0.1951319075758577, "3": 0.0003376933239304096, "4": 1.8602568283746146e-06, "5": 2.3570637035100503e-07}, "score": 1.805210202746322}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9577343393844588, "3": 0.02958321024605824, "1": 0.011954386462093068, "4": 0.0007107906613461764, "5": 1.7195187668630474e-05}, "score": 2.019101992160734}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5461318002327542, "4": 0.22328805826569836, "2": 0.22010318937109127, "5": 0.008773649715905593, "1": 0.001702822688275849}, "score": 3.0173265312618582}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6066914298368891, "3": 0.3748197632070164, "5": 0.015646281407094002, "2": 0.0028388591933257374, "1": 0}, "score": 3.6351474621342534}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5982739258082733, "3": 0.3881727913351362, "5": 0.007523546824644258, "2": 0.006019153163929659, "1": 1.037964376686435e-05}, "score": 3.607281230420371}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9577907707541872, "4": 0.04220698712344613, "3": 4.570367653246512e-07, "1": 0, "2": 0}, "score": 4.957792023458172}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.576487495431515, "4": 0.4178214670568533, "3": 0.00556572903077539, "2": 0.00011914229772804772, "1": 3.9416939125635435e-06}, "score": 4.570672926179316}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982589856269047, "4": 0.0017248675742437807, "3": 1.4685646056022505e-05, "1": 0, "2": 0}, "score": 4.998245758570429}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.932916116000902, "4": 0.067079888783272, "3": 1.2322559041686427e-06, "1": 0, "2": 0}, "score": 4.932917461358554}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5157882840119593, "5": 0.45566540489382973, "3": 0.02844239401065481, "2": 9.41308238675017e-05, "1": 0}, "score": 4.4270389283492895}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6452282685933526, "1": 0.3514943647027666, "3": 0.00315569664723127, "4": 0.0001050537955957948, "5": 1.6515800982415228e-05}, "score": 1.6519209519705575}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9909362685126625, "3": 0.007696301424504462, "4": 0.0011085776297625476, "1": 0.0001768732824754618, "5": 8.194493997108792e-05}, "score": 2.009982418562972}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6906118052354241, "4": 0.30728946281624486, "3": 0.0020952298877608927, "2": 2.976964204560703e-06, "1": 0}, "score": 4.6885109829538685}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7277101177412298, "4": 0.2655021607274804, "3": 0.006190706890608025, "2": 0.0005910389721547909, "1": 3.484384999696123e-06}, "score": 4.720328674294273}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7780348589182317, "5": 0.21112614089179485, "3": 0.010607984571085015, "2": 0.00023038447827730235, "1": 3.2832495583214406e-07}, "score": 4.200056462969517}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7810914285414232, "3": 0.1378153545868666, "5": 0.07662652368226044, "2": 0.004437627465382086, "1": 2.8220609884237938e-05}, "score": 3.9298511930512254}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7098918957829913, "3": 0.14853913798640742, "5": 0.12001884582371049, "2": 0.020818074567895844, "1": 0.0007252339249848948}, "score": 3.9276673642028617}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7333685109331805, "3": 0.19941591703325912, "2": 0.048554839911312646, "5": 0.01662071450175931, "1": 0.0020369709561262814}, "score": 3.7139833333807113}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957214870277094, "4": 0.00427456729183731, "3": 2.6611452040043295e-06, "1": 0, "2": 0}, "score": 4.995720104920079}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5543379279205483, "4": 0.40898414048968273, "3": 0.02235249569389861, "2": 0.010066934879151865, "1": 0.004251258169392096}, "score": 4.4991014028754295}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8037836484364246, "4": 0.1215297001979433, "3": 0.06768934479521817, "5": 0.006951093455876444, "1": 4.6063070626462404e-05}, "score": 2.3315560122360686}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8508380534391476, "2": 0.1489568518312032, "3": 0.00019752191850672715, "4": 6.823957334949269e-06, "5": 6.868272719430309e-07}, "score": 1.1493751241145305}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6654480538607634, "4": 0.3301490697513755, "3": 0.003945962794847639, "2": 0.00045625759802534496, "1": 0}, "score": 4.660590009213601}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.4297023368014043, "4": 0.35196730190997655, "5": 0.21018812835261327, "3": 0.008134735928447217, "1": 6.398698165053546e-06}, "score": 3.342628800729899}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.878992107755459, "4": 0.10336271209323036, "2": 0.016724989512890497, "5": 0.000918945905216435, "1": 7.746775179965601e-07}, "score": 3.088474106623494}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9964441560399442, "1": 0.0027348073071892546, "3": 0.0007667671408647721, "4": 5.0757305482913774e-05, "5": 3.5471184085432418e-06}, "score": 1.9981441158646596}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8607607910868285, "2": 0.1389037266289045, "3": 0.0003300362701493085, "4": 3.485423501155061e-06, "5": 2.0713365142026874e-06}, "score": 1.1395825253275715}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984016722884271, "4": 0.001596604647314326, "3": 1.3028062059603372e-06, "1": 0, "2": 0}, "score": 4.998400789068192}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9105568113403987, "4": 0.08747803899800372, "3": 0.0018624750570279396, "2": 9.904056938536858e-05, "1": 2.7235891691838193e-06}, "score": 4.908488911507202}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9929868260923941, "4": 0.007004377277528808, "3": 8.061805653879635e-06, "1": 0, "2": 0}, "score": 4.992979493952324}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9721278774622073, "2": 0.02783396893684122, "3": 3.690132867918725e-05, "4": 9.801658940158098e-07, "5": 9.294294747987044e-08}, "score": 1.0279110888643181}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9915835711299029, "4": 0.008409838571576442, "3": 6.212556947400246e-06, "2": 3.6490711324894395e-07, "1": 0}, "score": 4.9915766414850795}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8888610241313224, "5": 0.10939159719868957, "3": 0.0016785113157200568, "2": 6.121012138575069e-05, "1": 0}, "score": 4.107591489493289}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9935465415879404, "4": 0.005807448274684565, "1": 0.0005699978323714585, "3": 5.317107566380214e-05, "2": 2.1881763170419126e-05}, "score": 4.991740565030342}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7786364968005469, "4": 0.22135801739880595, "3": 1.4455336451123616e-06, "1": 0, "2": 0}, "score": 4.778638197173116}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6125589477314117, "4": 0.2500207911444681, "2": 0.13694183573261004, "5": 0.0002724972597158942, "1": 0.00020555087248357208}, "score": 3.11321289089694}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.971485051804453, "5": 0.026110770158996766, "3": 0.002301732220882841, "2": 9.769511501617629e-05, "1": 3.792561157300324e-06}, "score": 4.023602292638898}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5948479811179803, "4": 0.3824924364109791, "5": 0.022599194837451035, "2": 5.737981336674991e-05, "1": 0}, "score": 3.427634732520911}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7164067548209986, "4": 0.28164910256353404, "3": 0.0010029997693123726, "1": 0.0008445817698980033, "2": 8.925639385844549e-05}, "score": 4.712696702977337}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7167350302725508, "4": 0.28089650137631567, "3": 0.002270835621564412, "2": 8.703597665651254e-05, "1": 8.014974126842363e-06}, "score": 4.714267921857061}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8499482871462426, "2": 0.1499092302078173, "3": 0.00014030372794060408, "4": 1.8396945602261067e-06, "5": 2.5550981836447316e-07}, "score": 1.1501963913601363}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9792393638714079, "2": 0.020754095049367146, "3": 6.2169259104448455e-06, "4": 0, "5": 0}, "score": 1.0207665356327293}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.793393740814263, "1": 0.20627195725821093, "4": 0.00027574666339849185, "3": 3.374814854757876e-05, "2": 1.8824770040443863e-05}, "score": 4.174507515315258}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9989351274795695, "3": 0.0006049105270764156, "1": 0.0004581545432913078, "4": 1.6728044978841946e-06, "5": 9.594267109048968e-08}, "score": 2.000150389426614}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7043317697391501, "3": 0.2615491392836572, "2": 0.017003841327669363, "5": 0.01698847680092158, "1": 0.00012475259773779419}, "score": 3.721056833533539}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"1": 0.575260671024821, "2": 0.41724573424147604, "3": 0.007032953031365283, "4": 0.0004453895346219565, "5": 1.5107775694912394e-05}, "score": 1.4327083024904783}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7210737344537135, "5": 0.25229503562629335, "3": 0.024788786136179505, "2": 0.0016680721843379104, "1": 0.0001722897337122206}, "score": 4.223653701537285}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5083020100912077, "5": 0.37855083827447267, "3": 0.050278436078000165, "2": 0.034498928962221696, "1": 0.02836495144493686}, "score": 4.174180532126072}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.870663425401784, "2": 0.12418573141743672, "5": 0.0039864650226890475, "4": 0.0010670871845706413, "3": 9.322906767256015e-05}, "score": 1.1435198941615474}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8284017474790936, "5": 0.14016391777820908, "4": 0.023882999288467797, "2": 0.006269087307029473, "3": 0.00127945893173439}, "score": 1.6411344624108963}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8568307167008701, "5": 0.13044883474745606, "3": 0.011703884309625316, "2": 0.0010145744657123416, "1": 1.9873529113986736e-06}, "score": 4.116709839730508}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9773846150104679, "3": 0.01949090563290756, "4": 0.0031169843470791546, "5": 4.594452318551558e-06, "1": 2.914247263947384e-06}, "score": 2.0257357430844345}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9985066127142245, "4": 0.0014854121546755011, "3": 7.0695127386461465e-06, "1": 1.7604714648947457e-07, "2": 0}, "score": 4.9984997435367164}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.997555638229451, "1": 0.002174615960319169, "4": 0.00026791065765272, "3": 9.4060457832094e-07, "2": 3.4775382740724136e-07}, "score": 4.991030696126068}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8931045211446939, "5": 0.1027893736980496, "4": 0.0037549939685963215, "2": 0.0002510877696690258, "3": 9.620819661732154e-05}, "score": 1.4228675941947972}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9336233010887139, "2": 0.06617625276211214, "3": 0.0001950760647147353, "4": 4.448031140628147e-06, "5": 7.411787593914474e-07}, "score": 1.0665827257431224}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6724498384187431, "3": 0.2882401477352302, "2": 0.03274033418016721, "5": 0.006407664032344233, "1": 0.00016148908544003513}, "score": 3.652202197548196}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7264322032570941, "5": 0.2671793294913828, "3": 0.006329718592344249, "2": 5.791518182905905e-05, "1": 0}, "score": 4.260733997851262}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5573028558391413, "4": 0.4411320126139989, "3": 0.001556500884220835, "2": 6.7778541714036474e-06, "1": 0}, "score": 4.5557338289149225}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7217587407623421, "5": 0.2740197760044085, "3": 0.004121877564048566, "2": 9.879851338837697e-05, "1": 0}, "score": 4.269700519103925}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7710514778563519, "3": 0.16203973435956248, "5": 0.05385864229261803, "2": 0.012973422983689312, "1": 7.663083626637073e-05}, "score": 3.865642157140091}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5441168812311219, "1": 0.45472553582835373, "3": 0.0011358386525233651, "4": 2.0561945425311574e-05, "5": 1.1378341170233497e-06}, "score": 1.5464548200307744}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.940347447511829, "4": 0.059528279120730256, "3": 0.00011598496353015106, "2": 7.530387926620271e-06, "1": 0}, "score": 4.9402171144720475}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9404350496585276, "4": 0.059356935923186305, "3": 0.0002036660327471671, "2": 3.3176263020843036e-06, "1": 0}, "score": 4.940225717519519}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5667351624494096, "4": 0.3580603970382773, "2": 0.07120524482533756, "5": 0.003813449953327186, "1": 0.00018454264185920055}, "score": 3.294113320681197}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9794032072600647, "2": 0.02038518229797723, "3": 0.00018781333261874662, "4": 2.0983156783289617e-05, "5": 2.731540014338799e-06}, "score": 1.0208346863106614}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9662009245203432, "3": 0.027498550081738626, "4": 0.003296905426557146, "1": 0.002967296529894141, "5": 3.621764959780115e-05}, "score": 2.0312337206580255}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5958321375459417, "2": 0.3097947802235786, "4": 0.09324000604331169, "5": 0.0011237742419970016, "1": 8.934521180398244e-06}, "score": 2.7856748265131555}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7806314074761506, "2": 0.21923341386716563, "3": 0.0001211135527450852, "4": 1.1812574007250206e-05, "5": 1.587376348375971e-06}, "score": 1.2195175742129722}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9972652030890398, "1": 0.0027289182328964373, "3": 5.142246560289128e-06, "4": 5.158591880925295e-07, "5": 8.235497246969759e-08}, "score": 1.9972775024206608}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7210284812861985, "3": 0.21957015165724716, "4": 0.04747650129165983, "1": 0.009822611059035069, "5": 0.0021019279163565535}, "score": 2.3110064285642373}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6134964508091897, "1": 0.38192383693716003, "3": 0.004502193304262053, "4": 7.147291437248259e-05, "5": 5.9312771330881645e-06}, "score": 1.6227390527335788}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6374083735781012, "4": 0.34232732807939775, "3": 0.020010430827671694, "2": 0.0002510503603784064, "1": 2.2517677129714193e-06}, "score": 4.616889435507639}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9857865140632114, "4": 0.013078952764951418, "3": 0.000995418804816363, "5": 0.00013583508748973407, "1": 2.5124881525328704e-06}, "score": 2.027558338240532}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9930571321477887, "4": 0.005929378959739536, "2": 0.0006828850596753418, "3": 0.00032956893993615856, "1": 0}, "score": 4.991362819042805}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8153152831971543, "1": 0.18365765959820526, "3": 0.0010227031603036473, "4": 4.142914633821797e-06, "5": 1.4712401005304893e-07}, "score": 1.817373759074277}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.878446563660601, "1": 0.12059676732282634, "3": 0.0009537509302554016, "4": 2.7416626912006488e-06, "5": 1.0109562356873691e-07}, "score": 1.880362761207648}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9889559581991274, "4": 0.010872177238237853, "3": 0.00016310539027288387, "2": 3.4988997361175097e-06, "1": 0}, "score": 4.988791056319908}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9730799827158328, "3": 0.01967065200405739, "5": 0.005344098558953049, "2": 0.0018983361253112274, "1": 6.572311242760788e-06}, "score": 3.9818570508702056}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8472822541462982, "5": 0.15270123179884623, "3": 4.0231193440515745e-06, "1": 0, "2": 0}, "score": 4.152699116034313}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8586623050168718, "5": 0.10151685857068111, "3": 0.03735002492752198, "2": 0.0023023183165130873, "1": 0.00016819996811355965}, "score": 4.059057614421502}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8537697799920624, "3": 0.11040401257627967, "2": 0.02834782418721664, "5": 0.007084460893384501, "1": 0.000393558828754081}, "score": 3.838804064858092}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8267462276477606, "4": 0.17256218753994287, "3": 0.000687954813665215, "2": 3.00575431954056e-06, "1": 0}, "score": 4.826052776984203}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9997228521625594, "3": 0.00013531299250693133, "2": 8.045906598089552e-05, "5": 5.9898385887035916e-05, "1": 8.93143120138061e-07}, "score": 3.999760987692415}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8905241509122686, "4": 0.10903726221376536, "3": 0.0003881031124151314, "2": 4.6215653357513095e-05, "1": 0}, "score": 4.890047415311804}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9699534600166824, "2": 0.02997962184388938, "3": 6.539367609314072e-05, "4": 1.0801215250110744e-06, "5": 3.08899764316147e-07}, "score": 1.0301148892385301}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.969825626635278, "3": 0.02172160264578827, "4": 0.00782899053518596, "1": 0.0005256213349542584, "5": 9.81892322340918e-05}, "score": 2.037148528949208}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5488503835633043, "4": 0.44970673889739404, "3": 0.0012118162642263573, "2": 3.1591707047919993e-06, "1": 0}, "score": 4.547757083949785}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8311554897644358, "4": 0.16866504719829722, "2": 0.00010344370564928386, "3": 7.411793627200298e-05, "1": 0}, "score": 4.830876064240746}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6839883114698281, "5": 0.2283382949308376, "2": 0.06841458815322675, "3": 0.018710928763055856, "1": 0.0005475305493120668}, "score": 4.071155622842754}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"5": 0.534381380096775, "4": 0.4630758108326941, "3": 0.0025108824849535394, "2": 3.1242350367106215e-05, "1": 0}, "score": 4.531808376793104}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5575849001376314, "4": 0.4145215978392798, "2": 0.026524710732714757, "5": 0.0013000347293329266, "1": 6.819236155822032e-05}, "score": 3.3904607921398915}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9079394932419022, "5": 0.07786095276306394, "3": 0.014196771491196048, "2": 2.3185234937459187e-06, "1": 0}, "score": 4.063659573761672}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9865903068826704, "4": 0.0073222911598769674, "3": 0.004215317348877917, "1": 0.0016750593190064016, "5": 0.00019680286805541516}, "score": 2.0177752529073905}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.935315213284814, "4": 0.06447682642303824, "3": 0.0002032089089425138, "1": 0, "2": 0}, "score": 4.935116447472455}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7169161075785542, "5": 0.2611238664863597, "3": 0.020974234984991916, "2": 0.0009538024341962297, "1": 3.1751740983592845e-05}, "score": 4.238146827797219}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8029298811150156, "1": 0.1956594169248443, "3": 0.0014075805084176642, "4": 3.002020487978431e-06, "5": 1.1836994377196805e-07}, "score": 1.8057545225282297}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8077619501660712, "3": 0.11874651308419715, "5": 0.07306138505648058, "2": 0.0004292742353607721, "1": 0}, "score": 3.9534562826614095}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.8317654158668525, "4": 0.16280944681142479, "5": 0.005402472282994517, "2": 2.1478180470259928e-05, "1": 0}, "score": 3.17359311922737}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6469587967813981, "5": 0.3521239622136588, "2": 0.0006434874717741848, "3": 0.00027061862934802034, "1": 0}, "score": 4.350567467636055}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4274634035502975, "3": 0.40905706886330334, "2": 0.14654981121810987, "5": 0.016449371651129925, "1": 0.00048010823014992725}, "score": 3.3128521931596273}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6173102284878863, "5": 0.3574271549457362, "3": 0.0152718853467867, "2": 0.009988476504533432, "1": 1.6919108285020031e-06}, "score": 4.322173422177961}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9838692409237508, "4": 0.01606860356534625, "3": 4.993212374041091e-05, "2": 6.59870592583284e-06, "1": 3.642665004896898e-06}, "score": 4.983797133295031}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6909660556069591, "4": 0.30902268207652267, "3": 9.821801502796195e-06, "1": 0, "2": 0}, "score": 4.69095722913972}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8017348233439581, "4": 0.19190068622957884, "2": 0.004691419861580061, "3": 0.0011768310546048913, "1": 0.0004946710310829556}, "score": 4.7896923780890095}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8359280618655862, "2": 0.1570800077396975, "3": 0.005355345810731644, "4": 0.0013815585956321263, "5": 0.0002546559855253053}, "score": 1.1729540630836508}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7296161828694516, "4": 0.2678482205859973, "3": 0.002391075534092798, "2": 0.00014377816026163142, "1": 0}, "score": 4.726938091020939}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9782801950244684, "4": 0.019749312467758753, "3": 0.001940328481265511, "2": 2.9395763283714827e-05, "1": 0}, "score": 4.976281825058057}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6315012991178262, "5": 0.1801286249912997, "4": 0.09266355811906386, "2": 0.08340314170526722, "3": 0.012298069255777672}, "score": 2.1065103265801257}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8492762268937377, "4": 0.05496750425977029, "1": 0.04994396510027842, "5": 0.037855897455282186, "3": 0.00795571532342489}, "score": 2.1815145765292083}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7991937675812177, "5": 0.15451231145904834, "3": 0.039418319847299745, "2": 0.006247767993854446, "1": 0.0006275928059285796}, "score": 4.100715701409512}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8686230867232059, "3": 0.0884147736999041, "1": 0.036649822271734245, "4": 0.006257776804496725, "5": 5.43934399787331e-05}, "score": 2.0644436948342335}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6537458902808818, "3": 0.26768646233993887, "2": 0.059274172943512796, "5": 0.018108008137889584, "1": 0.0011848204913058576}, "score": 3.6283184984026886}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7706048137914708, "5": 0.1780670703396966, "3": 0.04992868957786452, "2": 0.0013940688188001265, "1": 4.837250873270623e-06}, "score": 4.125335796573962}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9908963633217096, "2": 0.008483017968340957, "3": 0.0004804860799022987, "4": 0.00010349740686677623, "5": 3.649358741758798e-05}, "score": 1.0099004581006752}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3641768782909858, "3": 0.33453887096228196, "2": 0.22983378620126146, "5": 0.048919783195022486, "1": 0.022473363848642337}, "score": 3.1872466632934464}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9209830378476094, "4": 0.07762984695761672, "3": 0.0008814037949255695, "1": 0.0003941099999269902, "2": 0.00010325664188583446}, "score": 4.918720457269051}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4904355770446518, "3": 0.26557321861281213, "2": 0.1809122087344408, "1": 0.032302966850987595, "5": 0.03076878429049141}, "score": 3.306457223308342}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9686481687196814, "4": 0.027725869074420532, "1": 0.002732643017091435, "3": 0.00045082018538193755, "2": 0.00042620973379450783}, "score": 4.959162624074039}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.995937825243842, "4": 0.003251032307494389, "3": 0.0005049211396459244, "1": 0.00020781526955935411, "5": 9.818726846908491e-05}, "score": 2.0070937338423858}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"5": 0.979892992113782, "4": 0.020088523442383904, "3": 1.613914291003473e-05, "2": 9.589153835516372e-07, "1": 0}, "score": 4.979876293626431}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.895007075635986, "2": 0.10492945623445542, "3": 6.188578804689255e-05, "4": 1.0924966241547228e-06, "5": 4.798789271333313e-07}, "score": 1.1050584258631384}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5867887527439606, "3": 0.23892898621730996, "2": 0.1354871875445437, "1": 0.02613855112050314, "5": 0.012654947924592949}, "score": 3.424335026901493}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9939905026989815, "1": 0.003501865333594214, "3": 0.0023696886589410263, "4": 0.00013543862124669722, "5": 2.4289754865202508e-06}, "score": 1.9991459874296413}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990574177100335, "4": 0.0009412616516648405, "3": 2.4394549933101676e-07, "1": 0, "2": 0}, "score": 4.99905824944336}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.87617248214649, "4": 0.11925112682405592, "1": 0.0023020068339171355, "3": 0.0018525881825697077, "2": 0.00041984036595310944}, "score": 4.8665758874468095}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8924564071951928, "2": 0.09899334037990984, "3": 0.004441488548737456, "4": 0.0025870483146894748, "5": 0.001521105356786041}, "score": 1.1217219581239064}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.991352008871262, "4": 0.008575943181218276, "3": 4.226019210494578e-05, "1": 2.396902946279491e-05, "2": 3.1502932948026185e-06}, "score": 4.991234186045852}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6366259064129124, "5": 0.3173113850529437, "3": 0.0313044881606995, "2": 0.014597536461777116, "1": 0.00015937924613353358}, "score": 4.256334020660452}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5458210850476338, "3": 0.23060704981429925, "2": 0.13280438804210024, "5": 0.08424285672425372, "1": 0.0065229535966400765}, "score": 3.56845745075147}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9699212687654986, "2": 0.030015120728926904, "3": 6.132481405182635e-05, "4": 1.8579626872246076e-06, "5": 4.3527535766289334e-07}, "score": 1.0301450851190321}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9570935738418758, "4": 0.04266797244582096, "3": 0.0002354402246190629, "2": 2.505409158597435e-06, "1": 0}, "score": 4.9568536089557105}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8013535768678073, "3": 0.17149437701469109, "5": 0.02652287793852689, "2": 0.0006283853280259208, "1": 4.79163481629114e-07}, "score": 3.8537702483691954}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9748206272115001, "4": 0.025166777687025778, "3": 1.1291289163569338e-05, "2": 2.119895194612418e-07, "1": 0}, "score": 4.974809976263047}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7524363881140648, "3": 0.12094874719745022, "1": 0.10869646566119566, "4": 0.017584648533105512, "5": 0.00033324919983620393}, "score": 2.0484213504753233}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9980379645130097, "4": 0.001958313765020315, "3": 2.779342969781695e-06, "1": 3.42016792572515e-07, "2": 0}, "score": 4.998034758302012}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5004491919325997, "5": 0.49571436259786494, "3": 0.003720735184430905, "2": 0.00010881384280196314, "1": 6.5807620912150206e-06}, "score": 4.491756412679324}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9996781751567282, "4": 0.0002974608316397779, "1": 1.9275301434731323e-05, "3": 2.231075057711023e-06, "2": 0}, "score": 4.999620974729389}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9080328569202726, "4": 0.08798417589925603, "1": 0.003874923725935889, "3": 7.037401275154833e-05, "2": 3.5997034424448346e-05}, "score": 4.896267216584754}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7963480818215998, "4": 0.20360054856139362, "2": 2.709869462657067e-05, "3": 2.0692505011452223e-05, "1": 0}, "score": 4.796276041335352}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5490312595623728, "4": 0.4368684539114494, "5": 0.013377331281075057, "2": 0.0007209481047775074, "1": 0}, "score": 3.4629030974802957}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9608250793367935, "4": 0.03734429960755758, "3": 0.0017665344314786579, "2": 6.359638047551628e-05, "1": 0}, "score": 4.958931822254644}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7072176149156073, "5": 0.18549717985281453, "4": 0.09921677263516818, "3": 0.008066678238208322, "1": 0}, "score": 2.762993101630194}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9934753505676187, "4": 0.0039668033902362084, "1": 0.002550771797294783, "3": 3.4283892962834077e-06, "2": 0}, "score": 4.98582320095543}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.998542255043888, "4": 0.0014454718079770527, "3": 5.954254809089367e-06, "1": 5.346817681089967e-06, "2": 0}, "score": 4.998521230974206}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5274512367948607, "3": 0.3302204226747545, "1": 0.11130285162051112, "4": 0.03082255967924701, "5": 0.00020218650387904063}, "score": 2.2811694587564526}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.580273926421745, "5": 0.2677626299728066, "2": 0.12404709339919141, "3": 0.026915116460628424, "1": 0.001000386653713421}, "score": 3.9897521580717914}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8426218062959684, "2": 0.10919732634404099, "1": 0.029600974378539865, "4": 0.015258096481431572, "3": 0.003316851464805924}, "score": 4.5321100103102}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997585856551338, "4": 0.00020049825790670735, "1": 2.2692433841148125e-05, "2": 1.4120569413177368e-05, "3": 3.102783332826142e-06}, "score": 4.999660164391886}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9744778372321657, "1": 0.02279432676683683, "3": 0.001932820391580086, "4": 0.0005369726477721749, "5": 0.0002576331201468773}, "score": 1.9809853304877276}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5030342096311123, "3": 0.4739596677700805, "4": 0.022744898511130485, "5": 0.0001655080042944093, "1": 9.573055801237186e-05}, "score": 2.5198502507225724}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7833175340604318, "1": 0.18977737582314666, "3": 0.026546005356402686, "4": 0.0003532010911192999, "5": 4.997086576784219e-06}, "score": 1.8374898788966245}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9988504400508519, "3": 0.000646443536995684, "5": 0.000407165956541986, "1": 6.011476937149327e-05, "2": 3.449065983503707e-05}, "score": 3.9995113961345763}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.44730788084385786, "3": 0.40771914977500096, "4": 0.13773289677510792, "1": 0.003913759726947556, "5": 0.0033244301600424023}, "score": 2.689245771734537}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7494624970371987, "5": 0.2134102946887374, "3": 0.024659686357519424, "1": 0.008896410484022007, "2": 0.003565175491857371}, "score": 4.1549319455622715}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7778300448634808, "3": 0.20249926946951521, "2": 0.015932490930838414, "5": 0.003727013635198596, "1": 1.0733766905237168e-05}, "score": 3.7693304578169484}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8505752616476557, "1": 0.09175951423862112, "3": 0.05223923176493818, "4": 0.005369899960309374, "5": 5.609650762764766e-05}, "score": 1.9713878070876765}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9787253511543689, "4": 0.02121082530575802, "3": 5.6217694604826206e-05, "2": 2.305677496440566e-06, "1": 0}, "score": 4.9786697092184236}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7108708224523839, "4": 0.2285152799969107, "3": 0.045708637251559256, "5": 0.014900477791518174, "1": 4.372284135238261e-06}, "score": 2.547436482907106}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8285112859995772, "4": 0.16900170083454036, "3": 0.0024711590188484, "2": 1.5052145782834346e-05, "1": 0}, "score": 4.8260106851507665}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7446742831719971, "5": 0.11266986330952199, "2": 0.0830146650038034, "3": 0.05957191743079392, "1": 6.124483736562664e-05}, "score": 3.8868839734619103}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9414663202145805, "4": 0.057705741751171484, "3": 0.0007808875504414091, "2": 4.332052572740994e-05, "1": 3.4273986349342404e-06}, "score": 4.940588794000802}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.999444975683012, "4": 0.0005514336691670406, "3": 1.1071427061887351e-06, "1": 0, "2": 0}, "score": 4.99944635067043}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5791630701752111, "4": 0.4192629459182676, "3": 0.0014716854063922917, "2": 0.0001013719634109516, "1": 0}, "score": 4.577489175906923}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9592098023727507, "5": 0.036336715594383895, "3": 0.004424029263804332, "2": 2.914043002789985e-05, "1": 0}, "score": 4.031854415419901}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5483345421085071, "5": 0.40890150541373005, "3": 0.023934580091338423, "2": 0.018756607287000217, "1": 7.205736644567523e-05}, "score": 4.3472377844006855}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8990745162630339, "1": 0.05920094348337504, "3": 0.040212917665962335, "4": 0.0014897667722022362, "5": 2.1850975327602843e-05}, "score": 1.9840570605758094}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7616273232747091, "3": 0.2338131936932029, "4": 0.004060157146837286, "1": 0.00046841415818512256, "5": 3.088641854407064e-05}, "score": 2.2415577591977947}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9999909853566321, "3": 5.301578243192208e-06, "5": 2.544812715154174e-06, "1": 0, "2": 0}, "score": 3.9999972432312516}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.507556400627382, "5": 0.2936872363037223, "1": 0.16832773438622153, "3": 0.022318474289736927, "2": 0.008107209917078704}, "score": 3.750170403403948}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8263612354576384, "3": 0.10202735656906511, "5": 0.06354093723085645, "2": 0.008063867490643514, "1": 6.0279594750979706e-06}, "score": 3.945367730372554}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8341594231792262, "2": 0.13297319665231888, "4": 0.015794713240083264, "3": 0.014702540161847326, "5": 0.002368914608104238}, "score": 1.219238340880281}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.48821241070130966, "4": 0.2592629192348379, "2": 0.22515187601042602, "3": 0.027368099381785867, "1": 4.175890203478741e-06}, "score": 4.010528037089811}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5014015660039787, "5": 0.4962997500577956, "4": 0.0021064390736235746, "3": 9.460171056381453e-05, "2": 8.91299625495114e-05}, "score": 2.991813607526381}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5031658356892901, "1": 0.4966497150822932, "4": 0.00017242572395321474, "3": 7.018654675211051e-06, "2": 1.9209398240381933e-06}, "score": 3.013202786714328}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5389824871359373, "1": 0.4607049788303536, "3": 0.0003108991421968587, "4": 1.5501466788411178e-06, "5": 8.129730254267265e-08}, "score": 1.5396092629098974}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8466005595141575, "3": 0.10653312599390093, "5": 0.044266017306339826, "2": 0.0025768764288855964, "1": 1.876213152696879e-05}, "score": 3.932522537707881}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5557321196637409, "3": 0.3274629041805614, "2": 0.0851169062326792, "5": 0.030607475575720695, "1": 0.0010801719905670297}, "score": 3.529670044311078}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7928997611022662, "4": 0.2058512002667263, "3": 0.0010948419106195577, "2": 9.415558352993178e-05, "1": 5.88984372450987e-05}, "score": 4.791440817091966}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.46445525720832415, "2": 0.32736651329100575, "4": 0.19786145805293803, "5": 0.009020751802395612, "1": 0.001295212117430902}, "score": 2.8859459320300194}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3531149632995174, "2": 0.31986088886639824, "3": 0.1776786317619432, "4": 0.14181184999568164, "5": 0.007526927161044606}, "score": 2.1307690311783625}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9991665387819118, "3": 0.00074756522423828, "4": 6.222821771993621e-05, "1": 2.3414899674638045e-05, "5": 9.115841679873148e-08}, "score": 2.0008488803725335}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.3117793976720522, "5": 0.273426317299433, "4": 0.27293860478127796, "3": 0.08612360044983271, "2": 0.05572332268659508}, "score": 3.140510351814165}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5126357320550784, "2": 0.268999623233564, "4": 0.1966422482303022, "1": 0.019426299240447566, "5": 0.0022918720644278506}, "score": 2.893373320128191}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5402790033407702, "1": 0.3332501066144631, "3": 0.12067123468928262, "4": 0.005639166545571221, "5": 0.00016022443610095888}, "score": 1.7991800813827374}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.835836850372065, "3": 0.14971215427059728, "4": 0.008786041588001661, "1": 0.0055179989139862076, "5": 0.0001468427898889484}, "score": 2.1622067850800595}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6224459572964486, "3": 0.21675447882120555, "1": 0.07991766194597626, "4": 0.0731820212149512, "5": 0.007695958177115397}, "score": 2.3062899352723183}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7615450491190943, "5": 0.1849538212366191, "3": 0.05328295993273562, "2": 0.0002094140846187863, "1": 0}, "score": 4.131253182338544}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7012341394087102, "5": 0.29866324834925634, "3": 0.0001012282186059305, "2": 6.308119738693711e-07, "1": 0}, "score": 4.298560983386255}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7858856740459287, "1": 0.15952843448702386, "3": 0.0407589064494512, "4": 0.013364604794657382, "5": 0.0004599333363322715}, "score": 1.9093392597241876}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8761719301580001, "1": 0.06437211735192946, "3": 0.05216832860159291, "4": 0.007246304240632992, "5": 4.078186747387476e-05}, "score": 2.002411166630029}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5158813560882884, "1": 0.4829794368719169, "3": 0.001128976622958722, "4": 9.890716183870235e-06, "5": 1.7495308231947068e-07}, "score": 1.5181697666622964}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9999845484373766, "4": 7.351273459142403e-06, "3": 4.2025713240216925e-06, "5": 2.5267466292966207e-06, "1": 7.76404647273776e-07}, "score": 2.000025708968769}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9999552252224203, "3": 3.788891382042922e-05, "4": 4.970058238084228e-06, "1": 4.7025581644784013e-07, "5": 0}, "score": 2.00004735884294}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9999390143796986, "3": 2.855886963164682e-05, "4": 2.191042515358456e-05, "5": 5.355100964467522e-06, "1": 4.684604800722459e-06}, "score": 2.0000837604579536}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6438222501880833, "1": 0.3541162605972806, "3": 0.0020535238711884376, "4": 7.5894229281042815e-06, "5": 2.2490314366992964e-07}, "score": 1.647953063663991}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8747048096004428, "1": 0.12315420618810947, "3": 0.0021278429753595193, "4": 1.2680324725709793e-05, "5": 3.318967202535827e-07}, "score": 1.8789999775160877}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8233909423586091, "3": 0.12270354942678617, "1": 0.043831646485213246, "4": 0.009777142651954436, "5": 0.00029650365869217886}, "score": 2.0993157206160267}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7740938186592742, "2": 0.22542199501374474, "3": 0.0004792975324734633, "4": 4.31680073788353e-06, "5": 0}, "score": 1.226393669976674}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9760455183527892, "2": 0.023650540740826956, "3": 0.0002517877719708651, "4": 4.021389400652427e-05, "5": 1.1013365249794974e-05}, "score": 1.0243188339439915}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8024931338216914, "5": 0.1070545030401741, "3": 0.08470679129160383, "2": 0.00563210678444418, "1": 0.00011316088395628998}, "score": 4.010744018795909}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9921821892919496, "4": 0.007812116133802926, "3": 5.457389478679636e-06, "1": 0, "2": 0}, "score": 4.992176967231735}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7008250465910286, "3": 0.203901142129011, "5": 0.07424610207379405, "2": 0.02066432697295605, "1": 0.0003627915975489126}, "score": 3.827927829574264}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8279270188227393, "3": 0.09469836916546541, "5": 0.05088958465692417, "2": 0.026476913880595292, "1": 7.847637710945588e-06}, "score": 3.903213819087829}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.949093715883249, "4": 0.050746775501248904, "3": 0.00015785684183455085, "2": 9.852425326917447e-07, "1": 0}, "score": 4.948934521050752}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9964815597680055, "3": 0.0031708439380840623, "4": 0.00022153277744307154, "1": 0.00011731475753860506, "5": 8.721851627340161e-06}, "score": 2.003522760385101}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5833577759394788, "2": 0.3659643700169584, "4": 0.02415205522548532, "3": 0.023099257611526095, "5": 0.00342529390250203}, "score": 1.4983208480840864}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9996537502582826, "4": 0.0003281906068233992, "3": 1.745320951268196e-05, "1": 0, "2": 0}, "score": 4.999636902754141}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9997640677363949, "1": 9.803823522768333e-05, "4": 7.1942814326035e-05, "5": 4.543072135203317e-05, "3": 2.0448357429443452e-05}, "score": 2.000202587929524}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7563874228350077, "5": 0.24302965647044242, "4": 0.00046469401557307585, "2": 6.0271572493099476e-05, "3": 5.463089460398445e-05}, "score": 1.9736854780270234}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9429055692652031, "2": 0.05617502589166702, "3": 0.0007759017163426435, "4": 0.00010672362595864873, "5": 3.6470166053528236e-05}, "score": 1.0581928988675295}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6393568242824732, "2": 0.3603073001944358, "3": 0.0003335669377016927, "4": 2.0316343303061105e-06, "5": 1.6710792095249053e-07}, "score": 1.3609812370558259}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.741129874361511, "2": 0.2025761527837357, "4": 0.05626731854725625, "5": 1.6439542453814943e-05, "1": 9.500092714351317e-06}, "score": 2.853704940109969}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9996778176818734, "1": 0.00022203112127360092, "3": 9.667719652647853e-05, "4": 3.22663099717347e-06, "5": 0}, "score": 1.9998810993078349}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9954230219348432, "5": 0.00449557499698165, "3": 7.006094863247931e-05, "2": 9.361977672465459e-06, "1": 0}, "score": 4.004406798819091}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9765718502569852, "3": 0.01843370309352327, "4": 0.003965909770102475, "1": 0.0010241379957189923, "5": 4.364255257796357e-06}, "score": 2.025354478281767}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9745804093458846, "4": 0.025304424933103226, "1": 8.040260353721338e-05, "3": 2.5810710926464035e-05, "2": 7.264972835794623e-06}, "score": 4.974300504946193}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9969148752082618, "4": 0.0030741083108113574, "3": 5.007248476619871e-06, "1": 2.9960554034709343e-06, "2": 2.3921930945204953e-06}, "score": 4.996896714464247}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.602060885550074, "5": 0.3103793561914325, "2": 0.03873842800156262, "1": 0.03279777504128633, "3": 0.01601982437918026}, "score": 4.118489792751307}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6758709794208071, "4": 0.3237327011944427, "3": 0.0002027882959886858, "1": 0.00015120938893738528, "2": 4.015217287929084e-05}, "score": 4.675135723337391}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.784433647292901, "2": 0.21415464173458454, "3": 0.0013324319135536542, "4": 6.448931543854216e-05, "5": 1.4413143854900754e-05}, "score": 1.2170707078321832}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7696964982130695, "3": 0.20515795178737722, "4": 0.01835112680683173, "1": 0.00654288551874908, "5": 0.00025136436954372083}, "score": 2.236071453903151}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9679840104230427, "3": 0.0207533831961153, "4": 0.010737794122103786, "1": 0.0004518956353661852, "5": 7.291610677051022e-05}, "score": 2.041995824146963}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4572782871423653, "4": 0.36033969327677057, "2": 0.1652050911947464, "5": 0.008834542122179842, "1": 0.00834170539251832}, "score": 3.1961204090741284}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9938423537903023, "2": 0.006155491307680578, "3": 2.089353228349655e-06, "4": 3.5563820284448985e-08, "5": 0}, "score": 1.0061597768902986}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9294641757346604, "5": 0.052656973448946334, "3": 0.017732971068133947, "2": 0.00014513880464846936, "1": 3.1069705474803984e-07}, "score": 4.034632807580998}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.49648693998598503, "1": 0.40312245686658715, "3": 0.08421378110885246, "4": 0.015794744829541338, "5": 0.00038096258109873444}, "score": 1.7138233826641922}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.6109126209128768, "3": 0.269334386194176, "4": 0.08036296847571099, "1": 0.03694565610253144, "5": 0.0024440550826930105}, "score": 2.400446957723952}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6238939668321916, "1": 0.26333170651484233, "4": 0.10076582686714598, "3": 0.006115308875490513, "2": 0.005868025928997111}, "score": 3.816042857276117}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9608300189512237, "5": 0.03859812418251856, "3": 0.0005683443914541373, "2": 1.9908437780977127e-06, "1": 0}, "score": 4.038025855964831}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9865060753981619, "2": 0.01348238851033683, "3": 1.1425955411973043e-05, "4": 9.758744393599738e-08, "5": 0}, "score": 1.0135055333529688}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.862951110621442, "2": 0.13635703170861502, "3": 0.0006312489757186132, "4": 4.719040358126963e-05, "5": 1.3386430678532176e-05}, "score": 1.1378146509842801}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8216743502501151, "4": 0.17133060953107526, "3": 0.005440354798111218, "1": 0.0010582859584254546, "2": 0.0004940306490942547}, "score": 4.812072999927763}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.46235117851245955, "4": 0.29221033812114877, "3": 0.2132366920394187, "1": 0.026970853393669947, "5": 0.005230224899570153}, "score": 2.7863777503006197}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.4859167577993651, "4": 0.21084879790320718, "5": 0.19400493152692816, "3": 0.07339017558029293, "2": 0.03582541576113507}, "score": 2.5911940384340006}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"4": 0.479867161623174, "3": 0.3138976505094274, "2": 0.20492438941520016, "5": 0.00118976912891032, "1": 0.00012068508600567834}, "score": 3.2770810356754057}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.889234392157538, "3": 0.09755228385884944, "1": 0.010069109571944129, "4": 0.003139152248715052, "5": 5.1149496612856e-06}, "score": 2.09377681868315}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9880088734993054, "4": 0.011919149149119963, "3": 7.096945391828233e-05, "1": 0, "2": 0}, "score": 4.987938899786689}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8944366770383116, "2": 0.059097893392637685, "3": 0.023973033128831842, "5": 0.015263086694836418, "4": 0.007228083167669047}, "score": 1.1897807887135396}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9458923134236648, "4": 0.05239486440480934, "1": 0.0012098914913075565, "3": 0.0004260009421830709, "2": 7.620503662614833e-05}, "score": 4.941684910374687}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6494168711852664, "3": 0.2932336932456896, "5": 0.039391587527743376, "2": 0.017882244245987288, "1": 7.537031957768494e-05}, "score": 3.710167227162426}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5163779605233088, "5": 0.4801691698423642, "3": 0.0030277100629181137, "2": 0.0004247068040224543, "1": 0}, "score": 4.476292261821004}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9786923481132535, "4": 0.020932317969378625, "3": 0.0003747527810231613, "2": 2.2230022585163755e-07, "1": 0}, "score": 4.978317501787434}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9865582757751565, "4": 0.009241368483684897, "5": 0.003186593822169634, "3": 0.0008297108428344086, "1": 0.00018391240012454325}, "score": 2.028688320854971}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.92029205337019, "4": 0.07943144153549626, "3": 0.00026743393342038214, "2": 7.999856131569157e-06, "1": 4.696937266880466e-07}, "score": 4.9200077641301485}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8379252189598809, "2": 0.16172970902380504, "3": 0.0003374694062191651, "4": 5.649107442861626e-06, "5": 1.3818588118917076e-06}, "score": 1.1624272154443367}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8783517316887102, "3": 0.08107355094234803, "5": 0.03023234201458398, "2": 0.010339852241440918, "1": 2.2319029401201235e-06}, "score": 3.928472370050974}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7539634401609151, "5": 0.14933781866249102, "3": 0.08690319334783989, "2": 0.009509100419609944, "1": 0.0002855369828869977}, "score": 4.042559852274376}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987849060252392, "4": 0.0012116393519666893, "3": 2.0694907405761176e-06, "1": 0, "2": 0}, "score": 4.998784219982537}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9091069908734458, "3": 0.05700730280318771, "5": 0.02958402675392879, "2": 0.003514630078790832, "1": 0.0007861845473723969}, "score": 3.96318887831151}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5307643189782987, "1": 0.4682120721894715, "3": 0.0009578091662432726, "4": 6.033983854445693e-05, "5": 5.399166328087144e-06}, "score": 1.5328825858169821}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5218615271237936, "5": 0.4317382228648513, "4": 0.039636042917308684, "2": 0.004497599360495328, "3": 0.0022651053703576698}, "score": 2.854891617033435}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9930197436547831, "4": 0.004417003738407923, "3": 0.0021610598636785682, "5": 0.00020127146277959513, "1": 0.00020089262432160156}, "score": 2.0113979894311327}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9713787402407221, "4": 0.016896029930585706, "5": 0.004699355064503957, "1": 0.004674752774966101, "3": 0.0023508192372058722}, "score": 2.0455662053121837}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.503717542277783, "4": 0.49625632572950756, "3": 1.799547896909107e-05, "1": 0, "2": 0}, "score": 4.503703645190444}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6034177114119139, "4": 0.37969057662527755, "3": 0.010703922670261748, "2": 0.004474040337381966, "1": 0.0017117312392596483}, "score": 4.578631681863457}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6926557475492153, "1": 0.2603246950466688, "3": 0.03579576101458574, "4": 0.01101932201819275, "5": 0.00020376320461843635}, "score": 1.7981208560484294}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9997948118239739, "3": 0.00010658039233189519, "4": 8.240874483842256e-05, "5": 9.771183139589494e-06, "1": 4.816254532122494e-06}, "score": 2.0002958956537613}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.994017595273339, "5": 0.004960192641437596, "3": 0.0010220115355841404, "2": 5.1505924348481286e-08, "1": 0}, "score": 4.003938078680951}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9749521666830678, "5": 0.023303884862794316, "3": 0.0017410567892055596, "2": 2.4428968237562267e-06, "1": 0}, "score": 4.021557951954462}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9031892304398932, "3": 0.08505122133869891, "1": 0.009172852246676194, "4": 0.002582140688124718, "5": 4.5035120951680315e-06}, "score": 2.081056165201201}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7897974964403166, "2": 0.20221869878297122, "3": 0.007523224071408584, "4": 0.00045106337827898434, "5": 9.225187897061175e-06}, "score": 1.218655301689983}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.970926667694036, "4": 0.01853253579432404, "3": 0.010533148443960421, "2": 3.0724569714941625e-06, "1": 0}, "score": 4.960391768714993}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9992214107180541, "4": 0.00047126688010128197, "5": 0.0002537616797743945, "2": 4.4937766142368304e-05, "1": 7.969689695383208e-06}, "score": 3.0009179136937587}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.5464476868052449, "2": 0.31380267945022916, "4": 0.07625784374487507, "3": 0.06007907306444817, "5": 0.0034071957047339834}, "score": 1.676366874010079}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"1": 0.967847766582802, "2": 0.03211798260305997, "3": 3.373154854242949e-05, "4": 3.151081259612972e-07, "5": 9.972953152268001e-08}, "score": 1.0321867933038493}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.9864432014506286, "5": 0.008667216407550709, "4": 0.004824971263308055, "2": 6.419639509584214e-05, "1": 1.0814769475836405e-07}, "score": 3.022094998156412}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8014957576176499, "3": 0.19356616247885372, "4": 0.0028694078343334713, "1": 0.002050462298074106, "5": 1.817221097936441e-05}, "score": 2.197309039893334}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.98773165043312, "4": 0.009389643053089428, "3": 0.0019891212911484655, "5": 0.0008857856204604266, "1": 3.6387439665447854e-06}, "score": 2.0234221292823835}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9954725260503575, "5": 0.004513775211046008, "3": 4.4169948115734914e-06, "1": 0, "2": 0}, "score": 4.00450940007133}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9951974655246226, "4": 0.004025952701881864, "5": 0.00047988311218427593, "3": 0.0002896648479616813, "1": 7.015721490635099e-06}, "score": 2.009774204043621}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7147011040381116, "2": 0.279782769537421, "3": 0.00480562582742215, "4": 0.0006666669247269174, "5": 4.381203529070171e-05}, "score": 1.2915692764163014}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.8584769741751882, "2": 0.14139477190513422, "4": 7.027868539997226e-05, "5": 5.755468607270582e-05, "1": 0}, "score": 2.8587905567670333}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9994822480798075, "4": 0.00026960301385532833, "3": 0.00022724768772180838, "5": 2.0894888464133214e-05, "1": 0}, "score": 2.0008291383860737}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8792998528027133, "4": 0.08065305462908641, "5": 0.03414257635677166, "3": 0.005904066076071886, "1": 0}, "score": 2.2696380257781685}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"2": 0.996445106548478, "3": 0.0032450169675850007, "1": 0.00029978350314816975, "4": 9.926416710157979e-06, "5": 6.075217213842141e-08}, "score": 2.0029652688681345}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9424117349177914, "1": 0.04180648533212205, "3": 0.015227208780709474, "4": 0.00054126747109997, "5": 1.3239735301355656e-05}, "score": 1.9745429759734758}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5927988766452185, "5": 0.3915636096473105, "3": 0.014957452625186584, "2": 0.000618712779644874, "1": 5.920236899899813e-05}, "score": 4.37519192949282}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.3741730455270342, "1": 0.22446775778456252, "4": 0.19673957089036706, "3": 0.18493397675627582, "5": 0.01968107627663512}, "score": 2.412990478090808}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4183077555772617, "3": 0.32708339827692245, "2": 0.24188008310444925, "5": 0.009880644861200839, "1": 0.002847189248333378}, "score": 3.190494760655194}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5683200219476019, "5": 0.35494213599123453, "3": 0.07096690055550145, "2": 0.005634666595312014, "1": 0.00013525847235749922}, "score": 4.272300403604512}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.612208419320532, "4": 0.36830775483375133, "3": 0.01923721297512346, "2": 0.00024063218346663374, "1": 5.331121122355129e-06}, "score": 4.592474333466294}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9708061016230785, "4": 0.028625126439988113, "3": 0.0005669202027678011, "2": 7.870067592013555e-07, "1": 0}, "score": 4.970238640446463}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9339534419640282, "5": 0.06492741015379253, "3": 0.0010850306972430813, "2": 3.203197292757287e-05, "1": 0}, "score": 4.063778448502281}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9753443898431147, "4": 0.018449413456067446, "1": 0.00564286140959444, "2": 0.00028353953252083914, "3": 0.0002775812152580543}, "score": 4.9575732659216305}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8249297481754234, "4": 0.11703720538387685, "5": 0.028523590421578475, "1": 0.01569939660765291, "3": 0.013809293105749096}, "score": 2.317755322028306}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8698697249349143, "5": 0.09825206604559189, "3": 0.026335661702755024, "2": 0.004697372355047859, "1": 0.0008446248446666654}, "score": 4.059987818099061}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.999928763541437, "1": 6.395358321500875e-05, "4": 5.6302540077552025e-06, "3": 2.7740258789489073e-07, "2": 0}, "score": 4.999738000247649}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999828796125555, "4": 9.115347742366811e-06, "1": 7.106412588934219e-06, "2": 0, "3": 0}, "score": 4.999962458968167}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8408470940386704, "2": 0.08651600960769593, "3": 0.05826818770457158, "1": 0.013529056136820265, "5": 0.0008378168813804067}, "score": 3.7289499440031086}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9761962470347116, "3": 0.019091476501453635, "1": 0.004304873181313993, "4": 0.00040531419560954797, "5": 2.122860683212582e-06}, "score": 2.0156035997664157}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.8882113567080608, "4": 0.09268543856802113, "2": 0.018426821233711338, "5": 0.0006544417341697379, "1": 2.1660851609779348e-05}, "score": 3.0755242003145122}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991804631039529, "4": 0.0008133174965415622, "3": 5.471930930904014e-06, "1": 0, "2": 0}, "score": 4.999175738025487}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9575240105014657, "4": 0.023095204047525915, "2": 0.01886644559668414, "5": 0.0005138991592428615, "1": 3.4314937120969126e-07}, "score": 3.005255870983273}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.956854286339799, "3": 0.034725749732710025, "5": 0.005392457829202335, "4": 0.0030251197545558555, "1": 1.6843143347038687e-06}, "score": 2.0569517183968746}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.58078903196944, "4": 0.40299507417539215, "3": 0.014504311919555115, "2": 0.0016809502844132456, "1": 3.0204428658907318e-05}, "score": 4.56283244664979}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7686462717671669, "4": 0.19730342633238954, "3": 0.018980772232200075, "2": 0.014028443946991284, "1": 0.0010366930413147745}, "score": 4.718501688664992}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8650275784130987, "4": 0.13376635771650375, "3": 0.0011623718071531132, "2": 3.326136648854548e-05, "1": 0}, "score": 4.86380769398908}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.46917363742619594, "5": 0.300680331551861, "1": 0.16825446044356465, "2": 0.03863365852323403, "3": 0.023252584310175378}, "score": 3.695395426009037}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9978159622886955, "4": 0.0021789830540257203, "3": 3.33231266842323e-06, "1": 0, "2": 0}, "score": 4.997814348556193}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7444422713690942, "4": 0.2355129447370479, "3": 0.02004326082868581, "2": 3.4663863407288656e-07, "1": 0}, "score": 4.724399169465548}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9898760299175242, "4": 0.01011450951897817, "3": 6.121098402570546e-06, "2": 1.701747319096388e-06, "1": 0}, "score": 4.989868126449111}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9923252532270359, "4": 0.0076525565303336655, "3": 2.0785789538617636e-05, "2": 1.2302552288127348e-07, "1": 0}, "score": 4.992305492954067}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5813417703906325, "4": 0.2467554040491397, "5": 0.16876177059296787, "3": 0.0031337622482600245, "1": 6.189705804138926e-06}, "score": 3.0029247986589263}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5654221266397307, "4": 0.4231731693095445, "3": 0.010986148796069578, "2": 0.00040057601869169303, "1": 1.6882077529121187e-05}, "score": 4.553584786943908}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6938108542018769, "5": 0.25932789866398054, "3": 0.04299200116547021, "2": 0.003592327348638699, "1": 0.00027661774134266586}, "score": 4.2083214522566905}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5919800523621725, "5": 0.23545901844749892, "2": 0.17152192122338042, "3": 0.001038606882361845, "1": 1.7785539579331375e-07}, "score": 3.891376011304145}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9693848024193229, "4": 0.029558350092634085, "1": 0.0007141720201946529, "2": 0.00020716665334204225, "3": 0.0001344203133901717}, "score": 4.9666945849868}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6450206159396686, "2": 0.2823880189718845, "5": 0.06968388452006521, "3": 0.002904927924004507, "1": 2.2414938882244107e-06}, "score": 3.50199603921645}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9226610853923196, "5": 0.0319480286869845, "2": 0.028275247604692303, "3": 0.017115424577071024, "1": 0}, "score": 3.9582820999837893}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8994842369327182, "4": 0.09628651510937979, "1": 0.0023838620413851024, "3": 0.001547827413526549, "2": 0.0002965748281102535}, "score": 4.890192549398865}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.673568655463286, "1": 0.31316921860857255, "3": 0.013155609939004033, "4": 0.00010332254064282583, "5": 3.1927498198332474e-06}, "score": 1.7002026144517157}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4797580810223123, "4": 0.35182295453040463, "1": 0.11343318429829609, "3": 0.036441293883123976, "2": 0.018541348256396924}, "score": 4.065934744635359}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.968703538231451, "4": 0.020401898882262952, "5": 0.010272369100489936, "3": 0.0005169368696013832, "2": 0.00010135128563962014}, "score": 1.103430802036092}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5359420175368641, "1": 0.2544187111761855, "4": 0.19062895200611596, "3": 0.014833709785534643, "2": 0.004170303767088396}, "score": 3.7495099871666553}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6718485539524097, "1": 0.29342717399269, "3": 0.02566086013234628, "4": 0.008970124709982463, "5": 9.301897996393018e-05}, "score": 1.7504529255628505}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9889531683583044, "2": 0.007337334129087237, "4": 0.0018183877902595224, "3": 0.0015868553316081629, "5": 0.000303567975666748}, "score": 1.0171804918586975}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9999722707254635, "5": 1.1783220853585017e-05, "3": 1.154007266627384e-05, "4": 3.9919009976917625e-06, "1": 0}, "score": 2.0000548735599444}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9999763235462916, "1": 9.039849788632101e-06, "3": 6.3720456613833625e-06, "5": 4.11600304581014e-06, "4": 3.11467109119868e-06}, "score": 2.0000159095636416}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9998471291759354, "1": 0.00013472646772164128, "5": 6.663284678651067e-06, "3": 5.396796614259357e-06, "4": 5.089886633737866e-06}, "score": 1.9999008398575924}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7938558208936134, "1": 0.14949774049670864, "3": 0.046424919765755183, "4": 0.00960698347169464, "5": 0.0006143588833506289}, "score": 1.9179842083876129}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.755394159801412, "3": 0.16156752697896876, "1": 0.05089458734897422, "4": 0.031578994829480865, "5": 0.0005646269558584621}, "score": 2.175524828426087}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987264113033415, "4": 0.0012636988035289501, "3": 9.466247316492478e-06, "1": 0, "2": 0}, "score": 4.998717368158457}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7142438630984081, "4": 0.2842599905259758, "3": 0.0014761862132839088, "2": 1.7015259480922584e-05, "1": 0}, "score": 4.71273574530369}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8699756293214971, "4": 0.12992270269784592, "3": 9.998853785457241e-05, "2": 3.564435338356401e-07, "1": 0}, "score": 4.869876078741991}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7756342323373665, "3": 0.12265624405918821, "4": 0.10125671036314868, "5": 0.00045093583559099317, "1": 1.8902943505260936e-06}, "score": 2.3265205777891733}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.833147018159407, "4": 0.1243973003847187, "2": 0.042189614083333105, "5": 0.00025882329184141506, "1": 6.627366780524801e-06}, "score": 3.0827121291612283}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9936100898634143, "4": 0.006378861154425753, "3": 1.0657997592248126e-05, "1": 0, "2": 0}, "score": 4.9935998203480185}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9616676078580323, "4": 0.038270573271462674, "3": 4.636531035499954e-05, "2": 1.4146207372691797e-05, "1": 0}, "score": 4.96159420727579}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8108639701064085, "4": 0.18899804649144733, "3": 0.0001363718789316954, "2": 3.5342200939862517e-07, "1": 0}, "score": 4.8107279113612185}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9581869058391002, "2": 0.04159423928624554, "3": 0.0002140604727323481, "4": 4.147943038383436e-06, "5": 4.3814431260654346e-07}, "score": 1.0420365653949049}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.9422002531844342, "2": 0.057446419522367884, "1": 0.00024678353058181653, "4": 9.276223049453397e-05, "5": 1.3343622534908972e-05}, "score": 2.9421794375718537}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9998206703614823, "3": 8.04830463554561e-05, "4": 5.70504838805377e-05, "5": 3.406203966684449e-05, "1": 7.192498140887928e-06}, "score": 2.0002895777918033}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.999960112362533, "5": 2.1065582719323548e-05, "2": 1.5309010214387592e-05, "4": 2.573875032220025e-06, "3": 4.942976355875929e-07}, "score": 1.000108281609631}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9999882437011058, "2": 8.421724000629574e-06, "3": 1.2294397255967356e-06, "5": 5.703606254186158e-07, "4": 0}, "score": 1.0000131620661543}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9863500678532472, "1": 0.009386422957800131, "3": 0.004231769719556897, "4": 3.1234509521231386e-05, "5": 3.2361477324741724e-07}, "score": 1.9949087857018524}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.710990557398898, "1": 0.20916024464669036, "4": 0.07615120315216425, "3": 0.002200251735360638, "2": 0.0014928764749249264}, "score": 4.078324199945538}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9815051129075245, "4": 0.018414507020201067, "2": 4.404749827693352e-05, "3": 3.3812736734231714e-05, "1": 1.994290918750738e-06}, "score": 4.981377738060964}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8747815945586721, "5": 0.09664697232455532, "3": 0.027642064234562586, "2": 0.0009229236927093474, "1": 6.1005050202927645e-06}, "score": 4.0671407823319}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9703488383209957, "4": 0.029061160122766792, "2": 0.0004884648715093037, "3": 8.611826775393558e-05, "1": 1.4257463984398832e-05}, "score": 4.969244143165155}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9095193962256132, "1": 0.04886892329336379, "3": 0.03981496628756797, "4": 0.001750184619069408, "5": 4.652712882036023e-05}, "score": 1.9945859936055637}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8954853618122094, "2": 0.1044614056204994, "3": 5.268946645022426e-05, "4": 4.7651339643886334e-07, "5": 3.458149930688631e-08}, "score": 1.1045683557663954}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4750271398753708, "2": 0.4357747489419057, "4": 0.08361889229768875, "1": 0.004128764786150706, "5": 0.0014502867260421668}, "score": 2.6424871273976205}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.997089884917899, "4": 0.0027586578603738146, "1": 0.00012586759963930036, "3": 2.0295081335894892e-05, "2": 2.863614270569614e-06}, "score": 4.996688682686016}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.7335561012515641, "4": 0.1755183470403231, "2": 0.08739481701211121, "5": 0.0033979329096410125, "1": 0.0001320436510857822}, "score": 3.094655380306905}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7934537791901537, "1": 0.19347422103747883, "3": 0.012872603315665707, "4": 0.0001839559925288687, "5": 1.5131634584672106e-05}, "score": 1.8198116335194998}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.601251477611068, "1": 0.1671291018928073, "4": 0.11233538200847684, "3": 0.11161966889336192, "5": 0.007658822711938736}, "score": 2.192138864925002}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9905371472630775, "4": 0.008945930883215863, "3": 0.0005123856468223566, "2": 2.6589745952466815e-06, "1": 0}, "score": 4.99002130216702}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.937970565999228, "4": 0.06162267965409801, "3": 0.00029876716509027106, "2": 8.466925578022586e-05, "1": 0}, "score": 4.937524321445143}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4524706861181235, "2": 0.2532482363360007, "3": 0.2098524739787355, "5": 0.08318873807436798, "1": 0.001224456753348684}, "score": 3.3631566082097066}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8627200087465179, "5": 0.12053236173398686, "3": 0.01451718730684218, "1": 0.0012573857688465894, "2": 0.0009621533620444121}, "score": 4.100319804191543}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6233872027572781, "4": 0.3759001986301251, "3": 0.0007086765085066809, "2": 3.2019806067927137e-06, "1": 0}, "score": 4.622672570688699}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.759795318300523, "5": 0.23191371374719433, "3": 0.008223379689290183, "2": 6.470057301533244e-05, "1": 1.8615594640237633e-06}, "score": 4.22355557763068}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6980116959393853, "4": 0.2565149067693863, "5": 0.02951706819705287, "3": 0.014752194907188421, "1": 0.0012034069739374396}, "score": 2.6151302533939296}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982436609717154, "4": 0.0017554413011969642, "3": 2.436129844966002e-07, "1": 0, "2": 0}, "score": 4.998244070324255}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9975130520917145, "5": 0.0021972823009539337, "3": 0.00027743302645903727, "2": 1.1813755323715766e-05, "1": 2.5483437821467945e-07}, "score": 4.0018954575715515}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.975851579809651, "4": 0.024136689747353557, "3": 1.0932407660770654e-05, "1": 0, "2": 0}, "score": 4.9758414261579285}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9909907100648233, "4": 0.008993461191298792, "3": 1.4617355534449733e-05, "1": 0, "2": 0}, "score": 4.990977293167631}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8314706904319011, "3": 0.1475165509008484, "5": 0.02022898099610918, "2": 0.0007770053672211161, "1": 5.5020104288412055e-06}, "score": 3.8711417496417355}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8940317186175749, "4": 0.10596451553692644, "3": 3.0277690402027547e-06, "1": 0, "2": 0}, "score": 4.894029350710552}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"3": 0.40653233835891256, "4": 0.3528566482983617, "2": 0.22343621436528446, "5": 0.012016426382832493, "1": 0.005158096824424321}, "score": 3.1431371325228468}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7919117184374166, "2": 0.20726846368176138, "3": 0.0007949871555351661, "4": 1.9107550249530793e-05, "5": 5.68755558811763e-06}, "score": 1.2089385183082078}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7537201754116535, "5": 0.12847740842826558, "3": 0.10602202748463717, "2": 0.011374738538905742, "1": 0.00040539688813980365}, "score": 3.99848971281892}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9479593873432605, "5": 0.02982378647520876, "4": 0.013905614493551318, "2": 0.006478475879911805, "3": 0.0018313437352943881}, "score": 1.1711533909899652}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6882618620630419, "3": 0.20752739996600872, "2": 0.0776284185815738, "5": 0.02553096882389707, "1": 0.0010511652166133954}, "score": 3.6595931729508813}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6866452126969028, "2": 0.3129237588693283, "3": 0.0004249580074166371, "4": 5.0910370781124064e-06, "5": 9.953245221993132e-07}, "score": 1.3137929242931163}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9969802773619169, "2": 0.0030175169131125305, "3": 2.292116342836908e-06, "4": 2.5095431985020675e-08, "5": 8.611468289525029e-09}, "score": 1.003022210515005}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9995014228309241, "4": 0.0004764699027661212, "3": 2.161928105513849e-05, "2": 1.6964971935098073e-07, "1": 0}, "score": 4.999479782420361}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.722081937273519, "1": 0.2734761127655528, "3": 0.004290504302159869, "4": 0.00013515247127302542, "5": 1.6041876076342142e-05}, "score": 1.731132754537973}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8892818927704645, "2": 0.10918837253039211, "4": 0.0006324527776447387, "3": 0.00046662435639835913, "5": 0.0004302790096688938}, "score": 1.1137401386717458}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6169537915627645, "3": 0.3486251161041663, "4": 0.033765658962661906, "1": 0.00041569680398833827, "5": 0.0002396553999405832}, "score": 2.416459737227894}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9927139757126172, "2": 0.007279486172245412, "3": 6.406884132422166e-06, "4": 1.4286552982041117e-07, "5": 5.059045069023488e-08}, "score": 1.0072929304451}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.6829378152789707, "3": 0.17544513605881054, "4": 0.08530965006434714, "1": 0.05325666062793439, "5": 0.0030502317733125182}, "score": 2.301958623729944}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9781455948867607, "5": 0.021098266463568403, "4": 0.0006813806163109774, "3": 5.59516294671223e-05, "2": 1.8203985578976757e-05}, "score": 1.0865673670974871}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9999869324773808, "2": 1.2448878741910577e-05, "5": 3.920066629417573e-07, "4": 1.39124169057648e-07, "1": 0}, "score": 2.999988474257745}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9385824160773525, "3": 0.048516016424391246, "2": 0.012878067607953682, "5": 1.2631460385256085e-05, "1": 1.0503332187033214e-05}, "score": 3.9257089427000293}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.57850169636604, "5": 0.23702567746063566, "3": 0.16121319458420277, "2": 0.01705506588549437, "1": 0.006201655539966701}, "score": 4.023097447083406}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5796087917499182, "4": 0.4184555321561555, "3": 0.0019174866249527375, "2": 1.6904613248527913e-05, "1": 0}, "score": 4.577658238105963}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.8015228566473215, "4": 0.18882692957148814, "3": 0.008077374478770837, "5": 0.0015722933389463616, "1": 0}, "score": 2.3904483268091106}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9778750078004036, "4": 0.011124920466878685, "5": 0.007340301947061393, "3": 0.003659705863361842, "1": 1.1658922234743475e-07}, "score": 2.047930333524737}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6615463499037882, "3": 0.33147088542018177, "1": 0.0044036184545047504, "4": 0.002560483170046716, "5": 1.8312951796684877e-05}, "score": 2.33224328847943}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9937985538371228, "3": 0.003153723376183284, "1": 0.003042953771299955, "4": 4.805483001453565e-06, "5": 4.344413400446815e-08}, "score": 2.000120510893658}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.47339260645026354, "4": 0.45146717990840557, "3": 0.07513711008373578, "1": 0, "2": 0}, "score": 4.3982567323792345}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9985394020130327, "4": 0.0014595803734774873, "3": 3.824931853182378e-07, "1": 0, "2": 0}, "score": 4.9985396537126565}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9986834858660825, "4": 0.0009604613653903432, "5": 0.00012541692133415805, "3": 0.00011785181827243105, "1": 0.00011260077044096367}, "score": 2.002302424964554}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4202441865931158, "2": 0.32706374115538844, "5": 0.1733967079690799, "3": 0.07929055199494232, "1": 3.955557523217525e-06}, "score": 3.439966327193171}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9205985754637379, "4": 0.06626697635987078, "5": 0.006604006953515444, "3": 0.0065148916460617675, "1": 1.5407086377502075e-05}, "score": 2.1588454807739343}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9713377994323712, "4": 0.028377355312996566, "3": 0.00019299852723408132, "1": 6.122652789665633e-05, "2": 3.0021492984528013e-05}, "score": 4.97090165962063}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.534796087286139, "1": 0.4407233873065832, "4": 0.014943999962575002, "2": 0.007874003042991283, "3": 0.001656406139114873}, "score": 3.1952165908746286}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995721639879392, "4": 0.0003877163664369594, "1": 3.586574127931995e-05, "3": 2.794238330344138e-06, "2": 6.565906972775993e-07}, "score": 4.999461261987045}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7624540382669739, "1": 0.15746797101996665, "3": 0.057339244179314644, "4": 0.020399053015872675, "5": 0.0023394222074392974}, "score": 1.9476876316205198}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7205054711681874, "2": 0.2758166901621917, "3": 0.00315965858481633, "4": 0.0003978973104165305, "5": 0.0001201976604335216}, "score": 1.2838105140610432}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5513288080446294, "5": 0.20185999821786357, "3": 0.15210767815873297, "2": 0.09310525980506183, "1": 0.0015940282118405518}, "score": 3.858759118708921}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9926813088127667, "4": 0.007311416122312202, "3": 6.212264964085378e-06, "2": 2.447393671983548e-07, "1": 0}, "score": 4.992675419137707}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7858483296460079, "4": 0.21387246490541115, "3": 0.00027601730360260127, "2": 6.271237169926109e-07, "1": 0}, "score": 4.785573069964307}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7656652616398751, "2": 0.2302050604718617, "3": 0.0036672225565908398, "4": 0.00042227575899686563, "5": 4.024289867903087e-05}, "score": 1.238967289323907}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6041039036086107, "5": 0.37533710881178467, "3": 0.008925240543740645, "1": 0.005872974760494662, "2": 0.005759215566039672}, "score": 4.337275037893678}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8918741890639491, "4": 0.10199145945875546, "1": 0.004030551756952624, "3": 0.0012939522301588036, "2": 0.0008086033967397327}, "score": 4.876872465680739}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9927617790196168, "2": 0.007204292140142696, "4": 2.0695588424407497e-05, "5": 1.2490477549625789e-05, "1": 4.2752374767307117e-07}, "score": 2.992840527098858}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8257247115550397, "3": 0.13517020728151571, "2": 0.01938007504957355, "5": 0.015889154649595703, "1": 0.003834870548549672}, "score": 3.830454019312965}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6233350523653767, "1": 0.3676537428210179, "3": 0.00865630432328556, "4": 0.00033701864592102697, "5": 1.7730309176275423e-05}, "score": 1.641729735431074}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4326024768424616, "2": 0.29691389441747584, "5": 0.2456976165876546, "3": 0.01707743461649602, "1": 0.0077069073021971465}, "score": 3.611671022629465}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9139447800987204, "4": 0.0854695591301429, "3": 0.0005848479845329143, "2": 2.9208908371213355e-07, "1": 0}, "score": 4.913359823520215}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9891973680735606, "3": 0.008132935097272025, "4": 0.002617427536090335, "1": 4.241909259617789e-05, "5": 9.780548418289464e-06}, "score": 2.013354713652295}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6411102435705357, "4": 0.3571066508286509, "3": 0.0017318702240963501, "2": 4.7939009040490324e-05, "1": 2.1780490784146846e-06}, "score": 4.639276676096118}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7170638648743928, "2": 0.2813874313532359, "3": 0.001501025856945258, "4": 4.602075811013591e-05, "5": 1.669420496234027e-06}, "score": 1.2845342195341474}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9753862378918997, "2": 0.02459575529293023, "3": 1.7413983936599807e-05, "4": 4.332014390146302e-07, "5": 1.4438045107781111e-07}, "score": 1.0246324607625537}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7782745072140813, "4": 0.2153462890092274, "3": 0.005122055272849234, "1": 0.0007112920877027111, "2": 0.0005452260928833355}, "score": 4.769928608796265}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9355016074410882, "1": 0.058596014304141644, "4": 0.005803761715636514, "2": 5.335573971328519e-05, "3": 4.044360594531491e-05}, "score": 4.7595700684392686}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5385453879773727, "3": 0.22399570531764063, "4": 0.20627816613756758, "1": 0.016557402436959544, "5": 0.014621503373827206}, "score": 2.663860363299502}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.9975561138640927, "2": 0.0024099068106675295, "4": 3.3707371690561726e-05, "5": 6.043067479977058e-08, "1": 0}, "score": 2.9976239209197773}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.43104548965700723, "4": 0.4055047871287714, "3": 0.12923682564944383, "5": 0.03397805173570377, "1": 0.00023461891462380816}, "score": 3.041946172632117}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8466134702711343, "3": 0.10671758781533958, "4": 0.046593636638342074, "2": 7.399182084429847e-05, "1": 0}, "score": 4.73974887044047}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.900144619710166, "3": 0.08013656797975022, "4": 0.014937502230025634, "1": 0.004220667449719903, "5": 0.0005605654228287324}, "score": 2.1074726095562597}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.667648447616852, "3": 0.22455960633061126, "5": 0.07818574007821444, "2": 0.029592761247774414, "1": 1.236899029740646e-05}, "score": 3.7944032831133208}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5351126144167597, "1": 0.46476141085895756, "3": 0.0001256141061657042, "4": 3.367385579870283e-07, "5": 0}, "score": 1.535364865629042}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8273777059699812, "1": 0.16343946530246425, "3": 0.009145500219019118, "4": 3.698829672813183e-05, "5": 3.4106253137773814e-07}, "score": 1.845781034828803}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7131366299981918, "2": 0.2307641467006413, "3": 0.03684568365659168, "4": 0.018726875394772472, "5": 0.0005248232598269281}, "score": 1.3627361010309755}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7642318555532961, "1": 0.22697935789926174, "3": 0.0076844643894709835, "4": 0.0010869077946173188, "5": 1.7268699027468703e-05}, "score": 1.7829306965572727}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8154624690427831, "3": 0.1554047306109529, "2": 0.014678433078713235, "5": 0.014447917391015029, "1": 5.932279603630029e-06}, "score": 3.829668435620729}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8955180512065002, "4": 0.06872041241099523, "5": 0.018691501942294467, "3": 0.016765283315200913, "1": 0.000304575059612583}, "score": 2.2099760758739833}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6954225170051264, "4": 0.2927937039585428, "3": 0.009511166971653873, "2": 0.0021709313716194107, "1": 0.00010090551237858625}, "score": 4.681267298858346}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9896547253083696, "4": 0.010229904851402785, "3": 9.0941874253374e-05, "2": 2.1498852421486658e-05, "1": 2.0949811547011746e-06}, "score": 4.9895153261726}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7034594812747835, "4": 0.2741640579861831, "2": 0.020638999776167954, "3": 0.0017355619977880098, "1": 9.721195949332443e-07}, "score": 4.660443615495056}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9833873742126781, "4": 0.01637343622059459, "3": 0.00020271915696862676, "2": 3.475983515342266e-05, "1": 1.2066037054015915e-06}, "score": 4.983112011034131}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9383365303121873, "3": 0.048751412870464673, "2": 0.012888575244326368, "5": 1.2536564796009466e-05, "1": 1.049849126681284e-05}, "score": 3.92545244444513}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.38601721965775765, "3": 0.20790492398647742, "5": 0.17696328452278098, "2": 0.1318922866157891, "1": 0.09721862214617248}, "score": 3.4136157728991376}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5017472861949688, "4": 0.4953836827473062, "3": 0.002825985855113559, "2": 4.1951557424801445e-05, "1": 0}, "score": 4.498837942776721}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.4966358587485391, "4": 0.4537784026455458, "3": 0.04558288326159204, "5": 0.004002232294109461, "1": 0}, "score": 2.9651469867700486}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3719574027508092, "2": 0.3371268533572806, "5": 0.268948652634578, "3": 0.021946039248558424, "1": 2.035599693108261e-05}, "score": 3.5726875412661334}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6757840747592183, "4": 0.28735422236007857, "2": 0.03416126087097925, "5": 0.0026737328815513283, "1": 2.6349401413240475e-05}, "score": 3.2584878214343624}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9539679657271433, "3": 0.03629723904392501, "4": 0.008469430583735987, "1": 0.00122358610694213, "5": 4.163376755048314e-05}, "score": 2.0521374229550777}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.8642404848157937, "2": 0.13511917664643647, "3": 0.0006100780244757093, "4": 2.78193148427042e-05, "5": 2.2584586288411045e-06}, "score": 1.1364318494059633}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4901109132108601, "5": 0.25058499866097506, "1": 0.24596987743464085, "3": 0.010487998243477651, "2": 0.0028352547129516298}, "score": 3.496511341591323}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9902299689107803, "4": 0.005405090955515962, "5": 0.0025751383967501, "2": 0.0012115512689876559, "3": 0.0005761174568007421}, "score": 1.028879674236805}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9176088210844165, "3": 0.0748938800556148, "1": 0.006767499570100111, "4": 0.0007270746525057689, "5": 2.63622655106501e-06}, "score": 2.0695884446225503}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8313259938647989, "5": 0.12524026081556885, "3": 0.03461912513713791, "2": 0.0062622696229643685, "1": 0.0025506720640673048}, "score": 4.070444698481407}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6743456268674249, "5": 0.3182468307373562, "2": 0.004137059538075761, "3": 0.0032699878816410833, "1": 0}, "score": 4.3067028755899734}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3829125671752536, "5": 0.29136788518320517, "2": 0.24147046777816178, "3": 0.07855578261457272, "1": 0.005690594811589315}, "score": 3.712798606433806}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9949980881327634, "5": 0.004821560249907146, "3": 0.00017693856075979788, "2": 9.187920672358374e-07, "1": 0}, "score": 4.004642795685373}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9039838172701716, "3": 0.07343937816191025, "1": 0.016134023111444847, "4": 0.006306351366609151, "5": 0.00013639431395100923}, "score": 2.070327243241558}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7513885756827293, "3": 0.24377921984538736, "4": 0.0042440002471298265, "1": 0.0005330725642536747, "5": 5.514100093069051e-05}, "score": 2.251899568425335}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.6245151127184659, "5": 0.3035156514380213, "4": 0.06808199441354736, "3": 0.0038849013034601035, "1": 0}, "score": 3.0505983029775536}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.47707775165686567, "2": 0.2878995339950747, "4": 0.21847084627667343, "5": 0.016421037365575392, "1": 0.00013035044548293526}, "score": 2.9631526684254723}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8126922234921201, "5": 0.18646323326561243, "3": 0.0007982242379900788, "2": 3.4863539092669405e-05, "1": 1.122086013426591e-05}, "score": 4.185561662902738}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5608533588795218, "2": 0.43029849358153893, "3": 0.008014851667131385, "4": 0.0008175624227532882, "5": 1.505143834860738e-05}, "score": 1.4488413960520934}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9296470081643403, "1": 0.05409171755238283, "3": 0.016061679489455114, "4": 0.00019871558036117985, "5": 7.864395318380079e-07}, "score": 1.9623697489252838}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6259521428035715, "4": 0.372662609815267, "3": 0.001357047357587943, "2": 2.529504578956583e-05, "1": 1.7109770095402265e-06}, "score": 4.624540118124761}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9582546616306898, "5": 0.024786185928897073, "3": 0.016441083256668602, "2": 0.0004986138048668897, "1": 1.8987351709008816e-05}, "score": 4.007290916419715}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9495313897827921, "4": 0.05037517927060172, "3": 8.956302415494886e-05, "2": 3.1567138258335108e-06, "1": 4.677069090157853e-07}, "score": 4.949434341399151}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"2": 0.743662816876205, "1": 0.25106003128008825, "3": 0.005243096605218893, "4": 3.3527887592254347e-05, "5": 5.123601711198025e-07}, "score": 1.7542516544968827}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9952354795096539, "3": 0.00403382387718661, "1": 0.0006318771282783489, "4": 9.707574576665527e-05, "5": 1.2675356191277329e-06}, "score": 2.003599902561585}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9707682409234036, "4": 0.02896578422158389, "3": 0.0002510852588038831, "2": 1.4168292678252628e-05, "1": 0}, "score": 4.97048951909676}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6447430072217064, "5": 0.34846084779981296, "3": 0.006757010638310928, "2": 3.809509592482792e-05, "1": 0}, "score": 4.341628002004588}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9972724363795162, "4": 0.00272032641597826, "3": 5.156853248799915e-06, "2": 7.328439866042835e-07, "1": 0}, "score": 4.997267157663039}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9816329475499957, "3": 0.010488372671698444, "1": 0.007117135157846193, "4": 0.0007578300544739595, "5": 3.7697909838157655e-06}, "score": 2.004898206725248}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9269417986640439, "3": 0.061054534866291386, "5": 0.007915657650233382, "2": 0.004078169676182046, "1": 8.900358510133564e-06}, "score": 3.938678024787913}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8964121436626845, "5": 0.06141008539931269, "3": 0.035802358781306255, "2": 0.006334987743111091, "1": 4.002409140604983e-05}, "score": 4.01281768398877}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6324413436456268, "5": 0.36674877577552334, "3": 0.0007983838988032262, "2": 9.99707507754428e-06, "1": 0}, "score": 4.36593094647843}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9895317940754358, "4": 0.010458010909960687, "3": 8.672902917253295e-06, "1": 6.055050098994278e-07, "2": 0}, "score": 4.989522211660153}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7735431462358492, "5": 0.16348997590072822, "4": 0.04141296843418474, "2": 0.015643965928795366, "3": 0.005908913531981965}, "score": 1.8056614317040907}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8470599733907428, "3": 0.08085413097126773, "1": 0.06799568715558515, "4": 0.0038188471313109463, "5": 0.00027132071137114946}, "score": 2.0213101010784547}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.49665319164246674, "3": 0.32806740128039535, "4": 0.17044863306435856, "2": 0.004829963829799711, "1": 3.4295074523153046e-07}, "score": 4.158924908105077}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6461458284761324, "4": 0.22540222637164967, "5": 0.06955770382724469, "3": 0.05762039465950155, "1": 0.0012721365108143046}, "score": 2.7158270465486787}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6071907723914319, "5": 0.3801631181793541, "3": 0.00988243539626727, "2": 0.0027569342378992133, "1": 6.22944072788206e-06}, "score": 4.364748312135982}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"2": 0.26028453004503266, "5": 0.20738317705524476, "4": 0.20014723665681844, "3": 0.1706766240960345, "1": 0.16150678900827872}, "score": 3.031615534654422}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7343201748205389, "4": 0.2577494989564132, "3": 0.005459465433340612, "1": 0.001519000084104755, "2": 0.000951305791295975}, "score": 4.722401498423218}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7647428847617226, "5": 0.16769973338286565, "3": 0.06499105070675483, "2": 0.0025215007979224827, "1": 4.3315457522395635e-05}, "score": 4.097535882464146}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6113387832927115, "3": 0.2702099309663191, "2": 0.0807176109604116, "5": 0.037598440707177695, "1": 0.0001345054283846012}, "score": 3.6055494841204876}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8783230364063759, "4": 0.08977686185135968, "2": 0.03094537888642618, "5": 0.0009537766818781641, "1": 0}, "score": 3.0607390937984387}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5297354913176018, "1": 0.465239449859282, "3": 0.004859146858489406, "4": 0.0001368523432311185, "5": 2.8955540226770764e-05}, "score": 1.5399802204269533}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9825302115915325, "2": 0.01735299786339067, "3": 0.00010767447530359839, "5": 4.783375926364274e-06, "4": 4.342553581704845e-06}, "score": 1.0176005078049122}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8666858753681168, "3": 0.09523071049236626, "4": 0.024455168373030044, "1": 0.011772432612596544, "5": 0.0018555706540789054}, "score": 2.137935360037365}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.976794391411837, "4": 0.023129313112547584, "3": 7.422400073889144e-05, "2": 1.891780705946765e-06, "1": 0}, "score": 4.976716559359959}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9849555999686193, "2": 0.015025011998381804, "3": 1.7614502315834233e-05, "5": 1.20000480141399e-06, "4": 5.612423658676533e-07}, "score": 1.015066724934389}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9927855135570096, "4": 0.0070592843462619495, "1": 9.143794614146917e-05, "3": 5.361053289274054e-05, "2": 1.0003655317606864e-05}, "score": 4.992437730703378}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5140211327872823, "1": 0.4849826315126587, "3": 0.0009847783179896875, "4": 1.1144148455637385e-05, "5": 2.777690010904183e-07}, "score": 1.5160252512452685}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9579761566455226, "4": 0.03729490711971566, "3": 0.004647359825932366, "2": 8.072784490568062e-05, "1": 0}, "score": 4.953168149953885}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.997163968457137, "4": 0.001759959643543145, "5": 0.00098351142846933, "3": 9.15356540346759e-05, "1": 9.521988004058577e-07}, "score": 2.0065610375041785}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6622775573454777, "5": 0.11105535591981419, "2": 0.10125910004971145, "3": 0.084830723192617, "1": 0.04057549362147122}, "score": 3.7019794243054136}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8602394657049868, "5": 0.08127323739129655, "3": 0.05256139311105388, "2": 0.0056434866732775904, "1": 0.0002807294959888322}, "score": 4.016582710431091}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8998503025430513, "1": 0.08829973257257223, "3": 0.011752510519267737, "4": 9.619944206976738e-05, "5": 1.3255527708190009e-06}, "score": 1.9236491588817868}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5293608730626983, "5": 0.43577104487228197, "3": 0.03379742712339837, "2": 0.0010697751422738498, "1": 0}, "score": 4.399834419238397}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7039119511747266, "4": 0.2385529931104033, "5": 0.048843518059184604, "3": 0.00865947917215388, "1": 3.152215266806448e-05}, "score": 2.632264836520992}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5422033301579342, "4": 0.2252819612990244, "2": 0.2206551066208628, "1": 0.00875725306731364, "5": 0.003098165862026987}, "score": 2.9933086522777286}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.638736035457923, "1": 0.3594442824728315, "3": 0.0018015425659415594, "4": 1.7809295818324272e-05, "5": 2.7733796062128107e-07}, "score": 1.642393691792153}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9101230261842571, "1": 0.08160930431860058, "3": 0.008197997187266609, "4": 6.912341692579542e-05, "5": 3.6233994180767376e-07}, "score": 1.9267280130532334}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5288868839240404, "4": 0.446411770792457, "3": 0.023458726995394336, "2": 0.0012021487481317537, "1": 4.0034458988268e-05}, "score": 4.502903974859376}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.8870997404838971, "1": 0.11233851620935678, "3": 0.00048038100908653637, "4": 7.813589528369527e-05, "5": 3.1637674800425277e-06}, "score": 1.8883076208968967}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6690209125001135, "5": 0.29433620811466277, "3": 0.030151325296766653, "2": 0.006474602909469195, "1": 1.580505077043079e-05}, "score": 4.25118854974093}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5189177428478565, "3": 0.16853926999381763, "1": 0.15900498898341164, "4": 0.14642665856628947, "5": 0.007110801592220251}, "score": 2.3237201770864115}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7445675492100531, "1": 0.13078482022754184, "3": 0.1050004125273948, "4": 0.017206581895819414, "5": 0.0024401794434099683}, "score": 2.015949301705701}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7933030293600108, "5": 0.12207581412509069, "3": 0.08191891192046788, "2": 0.0026788820955708833, "1": 2.2082303871329686e-05}, "score": 4.0347329355667965}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6812830639117795, "4": 0.3177380429469501, "3": 0.0009724000150938899, "2": 5.005030756805941e-06, "1": 0}, "score": 4.680301666188966}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7554737372134742, "4": 0.24411269391651366, "3": 0.0003802850708673702, "2": 2.6630989539611066e-05, "1": 5.149690202254739e-06}, "score": 4.755025875986965}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7114500626007989, "1": 0.17162174171211264, "3": 0.0820349420435474, "4": 0.028790269889033347, "5": 0.006102189120310753}, "score": 1.986300296584181}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7004861885213147, "4": 0.2966011120380301, "3": 0.002678460740557689, "2": 0.00021710726886415804, "1": 1.669018893671836e-05}, "score": 4.697323750364953}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8219206922732439, "1": 0.16078551614809947, "4": 0.016186705852999306, "3": 0.0007863301622340901, "2": 0.0003181056492546018}, "score": 4.338142498416799}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.649949767401206, "5": 0.3496779468344083, "4": 0.0003547880461126149, "2": 7.8657237820372e-06, "3": 7.848500998573738e-06}, "score": 2.3998022107398835}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9769270354204651, "5": 0.01750574790967121, "4": 0.005305644633353302, "1": 0.00016013985992877175, "3": 0.00010129525387287285}, "score": 2.063069697025338}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6864866365659956, "1": 0.3066857411927181, "3": 0.0067043614612831365, "4": 0.00011405063973491789, "5": 9.04543814242493e-06}, "score": 1.7002738084969213}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6787589444458806, "2": 0.3199607970218377, "3": 0.0012744029303185028, "4": 5.471181327715468e-06, "5": 3.3924305841603224e-07}, "score": 1.3225273879696973}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.6158450618848593, "2": 0.36633637876533914, "3": 0.012784017769238216, "4": 0.0038705719196653276, "5": 0.0011600501987682212}, "score": 1.4081579306174365}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5461666663997974, "1": 0.45150309555109297, "3": 0.0023199329374343743, "4": 9.410814982383345e-06, "5": 4.194892236193415e-07}, "score": 1.5508367042178894}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6781503910033728, "1": 0.2988339831785184, "3": 0.022336883459926352, "4": 0.000654173140970387, "5": 2.4183983082986346e-05}, "score": 1.7248836925284066}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7913994143886022, "3": 0.19345973036100572, "4": 0.014815282938928927, "1": 0.0002613037589419099, "5": 6.414695082427257e-05}, "score": 2.2230214604521823}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8185735227488575, "1": 0.17890468517817779, "3": 0.002496167807914162, "4": 2.384542936204049e-05, "5": 1.7745813890602554e-06}, "score": 1.8236444964823588}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5320248235078656, "3": 0.44437079108862826, "5": 0.017201615072621523, "2": 0.006390466554718825, "1": 1.197086831607362e-05}, "score": 3.560013831794759}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7422547246873664, "1": 0.21953649413291326, "3": 0.03652860962799099, "4": 0.0016578329189412251, "5": 2.1980233186810728e-05}, "score": 1.820373657654511}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.743127356852238, "3": 0.24532488148096476, "4": 0.008522994779169563, "1": 0.002890343863574529, "5": 0.00013423541111697485}, "score": 2.259883282166546}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7362254052553389, "3": 0.2440022823107742, "4": 0.014263281089998645, "1": 0.004930780436039107, "5": 0.0005780287211242767}, "score": 2.2693322100601465}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9623943548877294, "3": 0.03451515417286782, "1": 0.00207425961711623, "4": 0.0010147459432864935, "5": 1.3463962221008988e-06}, "score": 2.0344744304223426}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9979921312707524, "4": 0.0019767887387754984, "3": 3.038197661130138e-05, "2": 2.3010387489478787e-07, "1": 0}, "score": 4.997961756042662}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9904101388280039, "4": 0.004601370891476487, "1": 0.0029475292557119156, "3": 0.001927970275855546, "5": 0.00011287799644515874}, "score": 2.008521817753288}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7959313743360394, "3": 0.16087144680370777, "1": 0.030627278894626016, "4": 0.012472356046092963, "5": 9.750733032168926e-05}, "score": 2.1554814076811755}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6678885370980079, "2": 0.16728788306533382, "5": 0.16033788647094785, "3": 0.004481053965806164, "1": 3.848219439075526e-06}, "score": 3.821269380307982}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9346900144603162, "4": 0.06515110595743209, "3": 0.0001522537532179932, "2": 4.991814934501059e-06, "1": 0}, "score": 4.9345293041112885}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5977153928571142, "5": 0.3985396291099607, "3": 0.0036898517422090478, "2": 5.330822092196582e-05, "1": 0}, "score": 4.394743878597829}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7797694967183635, "5": 0.07240242396292618, "4": 0.07140444190621636, "2": 0.06586886548659678, "3": 0.010544498755880403}, "score": 1.5907869538235317}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.40081616427390604, "2": 0.36537074543411796, "3": 0.17113153630812186, "5": 0.0626680143165624, "1": 9.603710728085494e-06}, "score": 3.160762872807141}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"4": 0.48345463246551423, "3": 0.42754817794832534, "2": 0.08736546602285146, "5": 0.0016246741603732186, "1": 6.923390165440071e-06}, "score": 3.399324718303092}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8769563322841205, "3": 0.07998523690700875, "5": 0.04084318914391448, "2": 0.0022093708218092344, "1": 5.036415193929449e-06}, "score": 3.9564240649867273}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9148064684213644, "4": 0.08504110084554091, "3": 0.0001499088672753324, "2": 6.112266483472318e-07, "1": 0}, "score": 4.914657084680448}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9999700059218314, "4": 2.6201968930546123e-05, "5": 3.4582564918035537e-06, "2": 1.2474564658973167e-07, "1": 0}, "score": 3.0000329937431665}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9332921662957364, "5": 0.06661772471380516, "3": 6.687575921933902e-05, "1": 0, "2": 0}, "score": 4.066552395181772}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9563868432763121, "5": 0.03817681823752036, "3": 0.0052797211244387365, "2": 0.00015629989379994474, "1": 0}, "score": 4.032584507670018}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8205809942822033, "4": 0.17158239335819925, "1": 0.006041527510014224, "3": 0.0015754584022554812, "2": 0.00021178562451987248}, "score": 4.800463658394574}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9884926093803221, "4": 0.010550553035578326, "1": 0.0008407283151040369, "3": 8.507017958095885e-05, "2": 2.7711945285044755e-05}, "score": 4.985833210374038}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6060405384610232, "1": 0.21682569436401083, "4": 0.15577385047070608, "3": 0.013429234088083868, "2": 0.007919115964735907}, "score": 3.926295136832974}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7941553833236237, "5": 0.19575310150934247, "3": 0.009762136488524881, "2": 0.0003184934972366138, "1": 9.754917901184618e-06}, "score": 4.185324922738613}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9501244119639549, "1": 0.04907265126877945, "3": 0.0007993928947142057, "4": 3.332475955744485e-06, "5": 0}, "score": 1.9517333963744505}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7118155429676194, "4": 0.15448859563947512, "2": 0.08869926287649058, "3": 0.04215732607621715, "5": 0.0028382545807110896}, "score": 1.647833379673546}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9192131965413533, "4": 0.06096229626037142, "1": 0.01939140213631115, "3": 0.0003868740384332143, "2": 4.506831987858216e-05}, "score": 4.86056298003395}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.45056104775710304, "1": 0.4062824100238827, "4": 0.13898356364520362, "3": 0.0032620775542650873, "2": 0.0009054058153688476}, "score": 3.226636678711099}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8976882816977243, "1": 0.0747954817677931, "4": 0.01676489771811905, "3": 0.010661560314386925, "5": 8.967468923594457e-05}, "score": 1.969664894901369}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"1": 0.994523516909373, "5": 0.005351391277567904, "4": 5.822332560081423e-05, "2": 5.3139288865755054e-05, "3": 1.2972316125254982e-05}, "score": 1.0216593354017616}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9848332583525752, "4": 0.015045738259715079, "1": 8.254227265791934e-05, "3": 3.206238569845845e-05, "2": 5.905062642432034e-06}, "score": 4.98454224505935}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9989019459030799, "1": 0.0006269084755474129, "4": 0.0004636201422343384, "3": 4.192635601264515e-06, "2": 0}, "score": 4.99702035075367}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6337884216732641, "2": 0.19196195070591354, "5": 0.13866300693956746, "4": 0.0333378863663285, "3": 0.00224347337552995}, "score": 1.8511190620000326}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8407804427312855, "3": 0.08028718177295324, "5": 0.06361483379887124, "2": 0.015142766799711016, "1": 0.00017202925644585555}, "score": 3.9525259003103366}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6599188408051199, "4": 0.3175566663123846, "2": 0.02133230475632925, "5": 0.0011742472206206708, "1": 1.7611331990755194e-05}, "score": 3.2985377317234565}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8442322453698144, "3": 0.14136631200213506, "5": 0.0100590716488015, "2": 0.004338177282835445, "1": 2.5656928470686828e-06}, "score": 3.860008480095761}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9920791604899774, "4": 0.00778709034831394, "3": 0.00013225919000491094, "1": 0, "2": 0}, "score": 4.99194837927499}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8902632174834071, "5": 0.0748600431572407, "1": 0.03368046780524662, "3": 0.0010491388438845688, "2": 0.00014474876116404316}, "score": 3.972479937768862}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8316388391203136, "5": 0.0741741479422234, "4": 0.0640936489697093, "3": 0.016802913247785583, "2": 0.013281628691786732}, "score": 1.5358697213231625}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5194766326066179, "4": 0.4238567222836725, "2": 0.04778498548597715, "5": 0.008781794563694727, "1": 8.93580701310891e-05}, "score": 3.393460743872887}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7644024664292641, "3": 0.13863146469355522, "5": 0.08352780571362417, "2": 0.01318816556019294, "1": 0.00024091677887024026}, "score": 3.91779650486721}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9967660925795868, "4": 0.003146898859877168, "3": 5.853656243898277e-05, "1": 2.4155680213360523e-05, "2": 2.3214373887970906e-06}, "score": 4.996632434264334}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9853255704961955, "4": 0.014648929761648641, "3": 1.643898351887347e-05, "2": 1.3417659922572658e-07, "1": 0}, "score": 4.985317658678391}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9980006820041648, "4": 0.0019947319471471355, "3": 1.4160715985830208e-06, "1": 1.4568836249446948e-07, "2": 0}, "score": 4.998001847113215}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7530203246345211, "4": 0.1769840966287687, "2": 0.06993154108301722, "5": 4.0982885714589076e-05, "1": 2.2957290570214154e-05}, "score": 3.107088617174761}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8699536192165043, "3": 0.09549574380266258, "5": 0.02702334383597093, "2": 0.007513762049141079, "1": 1.3346531761715787e-05}, "score": 3.9164600209212717}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7981362154872014, "4": 0.20180197181007176, "3": 5.8994343000672445e-05, "2": 5.569095488846184e-07, "1": 0}, "score": 4.798077912138537}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.584075426224282, "1": 0.23085730190770595, "3": 0.14776839937386965, "2": 0.02457405665632559, "5": 0.012719200205157835}, "score": 3.123225858154013}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6826664492311204, "5": 0.19250570294592756, "4": 0.12393805433675896, "3": 0.0004965591239988564, "2": 0.0003898377231184596}, "score": 2.1432238138837816}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5149713041334749, "3": 0.24596215410174635, "5": 0.12592984661286802, "2": 0.11127672077883145, "1": 0.0018592618962276813}, "score": 3.65183621720614}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7814411233206916, "5": 0.1825003660879925, "3": 0.035373171974021594, "2": 0.0006775697896243438, "1": 7.137471328592654e-06}, "score": 4.145750734141387}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.993347585634036, "4": 0.006628458537041793, "3": 2.244445427285287e-05, "2": 5.687749497221886e-07, "1": 4.610473904465245e-07}, "score": 4.9933230988247255}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9449272959034409, "4": 0.05450728044979579, "3": 0.0002688927383700464, "1": 0.0002253213392920366, "2": 6.80093066263998e-05}, "score": 4.94384944109989}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9784478249784399, "4": 0.021518081441704733, "3": 3.2682509527289925e-05, "2": 3.060761223749299e-07, "1": 0}, "score": 4.97841561146025}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8787296974691066, "1": 0.11139621820006303, "3": 0.009780496787085346, "4": 8.961032591826921e-05, "5": 3.947196412673058e-06}, "score": 1.8985753377831849}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8353431838043286, "5": 0.10157142839207473, "4": 0.06016909082311905, "3": 0.0021528709543391076, "2": 0.0007608966632947854}, "score": 1.5918611216411587}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6446368138998789, "5": 0.3359586137394138, "4": 0.01859870173300263, "2": 0.0008033600206285812, "1": 5.085409976639126e-07}, "score": 3.6897129329600737}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5645982571743775, "4": 0.34233708454727707, "5": 0.07961211493793065, "2": 0.013401835550845322, "1": 3.638608997139732e-05}, "score": 3.488093697023655}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.712754640865322, "5": 0.2546863986182466, "2": 0.01923976784664627, "3": 0.012035022959758265, "1": 0.0012827808737809433}, "score": 4.200323775560773}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4705688626935318, "2": 0.46640487108178313, "4": 0.06081763394931994, "1": 0.0017703057627484324, "5": 0.00043785633660931787}, "score": 2.591747672064809}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4646759769745085, "2": 0.4386894760685641, "4": 0.09047449420385144, "1": 0.004905096070098208, "5": 0.0012511723339882165}, "score": 2.6444758252355163}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9562760809664931, "1": 0.027633604293560415, "3": 0.01579677142530631, "4": 0.00028798475881786057, "5": 5.5608588066614254e-06}, "score": 1.9887558192516963}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6531506185657161, "5": 0.3468347282361811, "3": 1.2914343048952931e-05, "1": 0, "2": 0}, "score": 4.346822416967045}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7474219753261021, "4": 0.25115469875557866, "3": 0.001417279627580591, "2": 4.307977592729206e-06, "1": 0}, "score": 4.745997376520382}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.50460052618463, "3": 0.46170519390914105, "5": 0.02995091511887972, "2": 0.003742859453212777, "1": 3.6127369788126946e-07}, "score": 3.560758855204948}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6433682323799003, "2": 0.3030142938993925, "4": 0.030441075950909734, "3": 0.02229080092940462, "5": 0.0008852822829758216}, "score": 1.4424603919220322}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4918055815682552, "4": 0.4199837747493951, "5": 0.08813755146676043, "2": 7.263591946609437e-05, "1": 0}, "score": 3.596186513801045}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6774343373268488, "1": 0.3000082214104314, "4": 0.020712137456325552, "2": 0.0013398668977368492, "3": 0.0005028471051379853}, "score": 3.774226507485958}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4875676007269155, "4": 0.3013917395800263, "5": 0.20215118923079453, "2": 0.008563485389755328, "1": 0.0003250075971700182}, "score": 3.6964812982508124}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9990683704365411, "2": 0.000931156216924515, "3": 4.7610139056917215e-07, "5": 1.4744584118409458e-08, "4": 1.0928191614521141e-08}, "score": 1.0009322001561165}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9975160175029235, "4": 0.001405066003106257, "3": 0.0009956308516039696, "5": 8.28134558094812e-05, "1": 5.081790453438926e-07}, "score": 2.004053694900297}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9317659895474601, "4": 0.05657127112108427, "5": 0.011541546670229637, "2": 0.00012081585875448408, "1": 1.345276611421498e-07}, "score": 3.0795332988163815}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9997239246958022, "3": 0.00017885842264888556, "5": 9.638152732206764e-05, "1": 0, "2": 0}, "score": 3.9999175230357755}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8750222275787756, "3": 0.1224431546955991, "2": 0.002182500589821832, "5": 0.00035142613888116477, "1": 3.7964850467061834e-07}, "score": 3.8735420919456547}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5571625780757152, "3": 0.4330373049810945, "4": 0.008841656791858532, "2": 0.0008167495977369162, "1": 0.00014148837496221682}, "score": 4.122067335895014}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5305576265320237, "5": 0.44123838236459834, "4": 0.022886112349632014, "2": 0.00308339350864209, "3": 0.0022304319783618973}, "score": 2.8411635866997877}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9966211411347474, "4": 0.0033515478335065696, "3": 1.9565025479553217e-05, "2": 3.574393666424487e-06, "1": 3.071731957203938e-06}, "score": 4.996586308252054}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6761339714205278, "5": 0.31316859227076166, "3": 0.010006103721894317, "2": 0.0006897630673457089, "1": 1.259822147174532e-06}, "score": 4.301779276407968}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6241180161810351, "1": 0.23674077803696417, "4": 0.11024346949665398, "2": 0.023445832932195043, "3": 0.005444581963089925}, "score": 3.861558420657859}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"2": 0.992389941247818, "3": 0.004289251657798615, "1": 0.0032332482400420155, "4": 8.339072214930085e-05, "5": 4.1013515181487635e-06}, "score": 2.00123508899909}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8255415613571307, "4": 0.16932575076859346, "1": 0.0032569079998043342, "3": 0.0014258398078661886, "2": 0.00044728731811792587}, "score": 4.813452580798719}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5635617886279102, "4": 0.41855840535362715, "3": 0.009747908790527254, "1": 0.005872217195614542, "2": 0.0022567927743619436}, "score": 4.531685177814076}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5464440802624136, "5": 0.2828379104554046, "4": 0.14025762063178124, "2": 0.024190042438010494, "3": 0.006262364810186058}, "score": 2.5888519570418564}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9994309248847006, "4": 0.000258861082800697, "5": 0.0001370331761189926, "1": 9.106764280964713e-05, "3": 8.205596856920723e-05}, "score": 2.000919810072373}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6417763182135631, "2": 0.3574449552612766, "3": 0.0007684930796776107, "4": 8.633660352295532e-06, "5": 1.5347255311214646e-06}, "score": 1.3590140046611205}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.8202639256180528, "4": 0.09387144867246029, "5": 0.08569341449756918, "2": 0.00016937489267223002, "1": 7.920027285492329e-07}, "score": 3.265087595604824}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.6667287282939979, "4": 0.30542943776342285, "3": 0.014730884541074341, "5": 0.013000974016254743, "1": 0.00010917526841718253}, "score": 2.6644840385131316}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9956703092542522, "1": 0.003623242267491469, "4": 0.000559960674952476, "3": 8.634488420518482e-05, "5": 5.983528624766247e-05}, "score": 1.9977625291370422}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.36520278658206656, "2": 0.3231446898079757, "3": 0.31095020256292066, "5": 0.000667603582469106, "1": 3.4300692997079176e-05}, "score": 3.0433247206095464}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7109694484026134, "4": 0.2590725087239422, "3": 0.0264779915129199, "5": 0.00347897697888027, "1": 6.577006160278288e-07}, "score": 2.5550595134795975}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9911130653307231, "4": 0.00882586468199492, "3": 5.3908521188155655e-05, "2": 5.219390110315618e-06, "1": 1.350101207237293e-06}, "score": 4.991045254399484}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9806220919558144, "4": 0.018304629005523508, "3": 0.0010644761273976115, "2": 7.447843727625313e-06, "1": 0}, "score": 4.979544047489301}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5868315898864476, "3": 0.3223038322215909, "5": 0.09085762119375924, "2": 4.08894323109693e-06, "1": 0}, "score": 3.768544947329328}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.6388332584810041, "4": 0.2603170416131404, "5": 0.10083855564498224, "2": 8.26911556193678e-06, "1": 0}, "score": 3.4619872120679096}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6203850781199726, "3": 0.28949365479958816, "4": 0.08962589446755177, "5": 0.0004744408050319926, "1": 2.0536433609802338e-05}, "score": 2.4701484156007525}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.995455745511421, "1": 0.004209018895058711, "4": 0.00014275181428239833, "3": 9.885721713861756e-05, "5": 9.334754380492416e-05}, "score": 1.9964553835930465}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7482538925931853, "4": 0.23586699814556716, "1": 0.007160954477362168, "3": 0.006335304500417112, "2": 0.0023796439579251943}, "score": 4.715678731443829}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8992070316300583, "5": 0.10018372787261473, "4": 0.00040924604736514543, "2": 0.00014212252788412428, "3": 5.579161325292484e-05}, "score": 1.4022171921229185}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9875614107887066, "4": 0.012140321633539088, "1": 0.00023258472284054418, "3": 5.0660755518008784e-05, "2": 1.3685728273106812e-05}, "score": 4.986786943121696}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6371575390097423, "2": 0.2655429715458153, "3": 0.049763076783346995, "4": 0.034021860673212126, "5": 0.013514439129052475}, "score": 1.5211925224695342}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5895068317578639, "5": 0.2998229935371432, "3": 0.05061704002459915, "1": 0.04815524578226932, "2": 0.011894663795279132}, "score": 4.080951149650961}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.765249863140112, "4": 0.23262894628856026, "3": 0.001971062187630603, "2": 9.686938822196365e-05, "1": 5.270411615811255e-05}, "score": 4.762927373160183}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.45144654832971887, "4": 0.39111568233741045, "1": 0.1485388409084285, "3": 0.005546785545527101, "2": 0.0033425108597606203}, "score": 3.993598156676707}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.524017446692853, "4": 0.31835686768553273, "1": 0.13697660967906827, "3": 0.01210207201657813, "2": 0.008540195322124983}, "score": 4.083905726275671}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6612612650250705, "3": 0.25557282004120224, "4": 0.06902990931305351, "1": 0.008477517666827288, "5": 0.005658295955669499}, "score": 2.402130086075734}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8715969284100258, "2": 0.12531851031724972, "3": 0.0027951346450313923, "4": 0.00026795031136435474, "5": 2.152610873073037e-05}, "score": 1.1317987284137532}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5907875509855195, "3": 0.2773003677999841, "2": 0.11311112911929372, "5": 0.01876654341707442, "1": 3.424517085949807e-05}, "score": 3.5151411025879704}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9970100199205879, "1": 0.001572051224415461, "4": 0.0006256408960161187, "3": 0.0005840131840282667, "5": 0.00020825568049550515}, "score": 2.0008880108100877}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9768750379089989, "2": 0.017191598049582913, "4": 0.003268761866077753, "3": 0.0016488239545801855, "5": 0.0010137398144331722}, "score": 1.0343505608351098}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9322350654030366, "1": 0.062223508529954556, "4": 0.005145251646540485, "2": 0.00023033587228049878, "3": 0.00016472419963024868}, "score": 4.744939973991768}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6066070691923875, "4": 0.3638100093300265, "3": 0.01864132851500914, "1": 0.0076147912957756445, "2": 0.003324112692121454}, "score": 4.558474643129983}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9841254797389173, "4": 0.013021901608320464, "3": 0.0024771093086441566, "1": 0.0002806621289941577, "2": 8.335808107148736e-05}, "score": 4.9806509347111945}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9838537795401179, "5": 0.014387406552543357, "4": 0.0015344280089402125, "2": 0.0001611648183758727, "3": 6.141951128003157e-05}, "score": 1.0624370265625254}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.42375304689527243, "5": 0.16327447477674983, "3": 0.14865629241900488, "1": 0.13791638269088421, "2": 0.12639129099489022}, "score": 3.348080903014451}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9965019249700944, "1": 0.002680869759455198, "3": 0.0007629307431000875, "4": 5.0684014142237435e-05, "5": 3.5028171963324446e-06}, "score": 1.998193937305134}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9703122471562334, "2": 0.02961514183407341, "3": 6.778070435887207e-05, "5": 2.8897082861010614e-06, "4": 1.8097605757993796e-06}, "score": 1.0297676952523631}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983988233533201, "4": 0.0015994742459775734, "3": 1.31324025192896e-06, "1": 0, "2": 0}, "score": 4.998397898650044}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7801067809612484, "4": 0.21799978553018995, "2": 0.0011862360118700854, "3": 0.0007067645319121858, "1": 0}, "score": 4.7770278808313}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9871902113001075, "4": 0.012775589489050275, "3": 3.2258112369947835e-05, "2": 1.329830589712045e-06, "1": 0}, "score": 4.987155896943253}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5739448312996923, "5": 0.41106332538167684, "3": 0.014294513309391563, "2": 0.0006776761764324612, "1": 1.912953657203013e-05}, "score": 4.395356278393513}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9367626661712192, "4": 0.056946286359701725, "1": 0.0034684759118329823, "3": 0.0018125178917025497, "2": 0.0010042181504400242}, "score": 4.922541667748973}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6326539555596095, "2": 0.28513121533015073, "4": 0.07800438000179095, "1": 0.0025199114927504985, "5": 0.001690253096529828}, "score": 2.7912137884755195}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.978138063194677, "4": 0.02183606540028544, "3": 2.4298571387108042e-05, "2": 3.528086482266953e-07, "1": 0}, "score": 4.978114252329838}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7054195265747608, "5": 0.23879412498659958, "3": 0.053560951135450084, "2": 0.002185405902396671, "1": 3.886668892623455e-05}, "score": 4.180745965266708}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"3": 0.9858148982229414, "2": 0.012793935620167902, "4": 0.001347480805243275, "5": 4.15518297636281e-05, "1": 1.2746358856779612e-06}, "score": 2.9886340898108097}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9982378374348327, "3": 0.0017323740984295074, "4": 2.683893302011224e-05, "5": 2.7714081764230306e-06, "1": 0}, "score": 2.001794366508622}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9227531346535391, "3": 0.03516289752015218, "5": 0.02832270780908038, "1": 0.01160277482991978, "4": 0.0021566676568733002}, "score": 2.1128417865246014}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9129344328739504, "5": 0.08568733048112498, "4": 0.0012386663529107736, "3": 0.00013858218705425674, "1": 0}, "score": 2.2596781629255314}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9949205529428717, "2": 0.005061681695549392, "5": 7.510165914166308e-06, "3": 5.698235456985727e-06, "4": 3.7437454142184863e-06}, "score": 1.005114354225431}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9308850581134055, "5": 0.05556530407165565, "3": 0.013537102905666523, "2": 1.215249572264645e-05, "1": 0}, "score": 4.0420039122374085}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6796264160110722, "5": 0.3153294543152109, "3": 0.005027522303635538, "2": 1.5623396368888638e-05, "1": 0}, "score": 4.310270990517337}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5998801642283649, "4": 0.39373381281439257, "3": 0.006373175659189126, "2": 1.1349311235217775e-05, "1": 0}, "score": 4.59348517897968}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7772693149361222, "4": 0.222082287805258, "3": 0.0006460294286716549, "1": 0, "2": 0}, "score": 4.776625124423679}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5836957312846541, "4": 0.39039167459139745, "5": 0.025607187632749346, "2": 0.00030329124787999135, "1": 0}, "score": 3.4413036920737023}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8468588374720862, "5": 0.11481249035653031, "3": 0.03500534902094689, "2": 0.003308591529304532, "1": 1.452176499246587e-05}, "score": 4.073146408332219}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.707634048193585, "5": 0.25980220174824636, "3": 0.03167910068206265, "2": 0.0008814870033711874, "1": 2.0475932068177136e-06}, "score": 4.22635423661489}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9967914359787009, "4": 0.0031891128637501634, "3": 1.667051446416866e-05, "2": 2.150369220722725e-06, "1": 0}, "score": 4.996771092964563}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8250467397581043, "1": 0.15286740000444118, "4": 0.021587945473654148, "2": 0.0002784541901272441, "3": 0.00021805068984053372}, "score": 4.365670096227043}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9353075961087342, "1": 0.056086513299433184, "5": 0.006294198140378218, "4": 0.0019198304579354892, "3": 0.0003914988421535447}, "score": 1.9670272289056192}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7468437020091702, "4": 0.20541396387220634, "2": 0.047407278842144254, "5": 0.00027182012923333604, "1": 6.307380558760744e-05}, "score": 3.1584242032377774}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6926314080538939, "4": 0.3057407372651527, "3": 0.0016196678202365668, "2": 5.960679937028423e-06, "1": 0}, "score": 4.691001357167723}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9505244823947931, "4": 0.04906990327725287, "3": 0.0004039210984270405, "2": 6.508445563354567e-07, "1": 0}, "score": 4.950120249998322}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.988838108373119, "1": 0.008750241316187943, "4": 0.0023671239120251104, "3": 3.5514375492488325e-05, "2": 7.385964854053022e-06}, "score": 4.962538663263357}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9487348678165195, "4": 0.045574373731676436, "1": 0.005414069233537882, "3": 0.00022982923070682715, "2": 4.334249480264375e-05}, "score": 4.932179424829968}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4307729611264923, "2": 0.30598741662983997, "3": 0.23990674347661972, "5": 0.019826616030580408, "1": 0.0035053370517319545}, "score": 3.1574282481832747}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9919908237421278, "4": 0.008007861758842732, "1": 0, "2": 0, "3": 0}, "score": 4.991992127714817}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6025976813719658, "4": 0.3403946497311524, "2": 0.02126565816781581, "1": 0.021060521710600986, "3": 0.014677957505185826}, "score": 4.482208545325228}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.44661685481272184, "5": 0.3781174376501254, "4": 0.16733861244166406, "3": 0.007872674023450031, "1": 5.163215090272634e-05}, "score": 3.476854698537535}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.5467155445864722, "4": 0.29907814058068444, "5": 0.12294128442276196, "3": 0.017301617235962772, "2": 0.013958034314210397}, "score": 2.4375685606991335}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8366147577324436, "3": 0.06643091788991166, "2": 0.06571799463823108, "5": 0.030734852737385746, "1": 0.0005005595426256057}, "score": 3.831366112228389}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4559510599037247, "2": 0.39108314286630075, "4": 0.14676811304293477, "5": 0.004913957272381559, "1": 0.0012828167921482632}, "score": 2.7629470353898613}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9897778004843673, "4": 0.01020364264893853, "3": 1.7183223981859062e-05, "2": 2.1001014455309836e-07, "1": 0}, "score": 4.989761348958636}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8314113754286371, "4": 0.16630986068218606, "2": 0.001493044432975819, "3": 0.0007675338309965967, "1": 1.7206471412404424e-05}, "score": 4.8276069436719276}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5526970265609901, "4": 0.4261472649839705, "3": 0.019541305948100277, "2": 0.0016060935738387947, "1": 7.187177661084e-06}, "score": 4.52992256637575}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9328787627874336, "2": 0.06704087975884152, "3": 7.949090065694914e-05, "4": 7.12957518253016e-07, "5": 1.251574865803566e-07}, "score": 1.0672025029737655}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9895801294311559, "3": 0.008164934292914408, "1": 0.0013886128218987843, "4": 0.0008624032407410372, "5": 3.912773892794858e-06}, "score": 2.0085128663375067}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9431627535401067, "3": 0.03387533874431815, "1": 0.02226006083966241, "4": 0.0006918066838311499, "5": 9.908644500069552e-06}, "score": 2.0130286189197015}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8301603118788129, "5": 0.11682683304485203, "4": 0.05174990927387661, "3": 0.0008847910876280872, "2": 0.00037265432896476216}, "score": 1.6247027326113401}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9981714466444742, "2": 0.0018168955065500033, "3": 1.1193727289442188e-05, "4": 3.707844279338369e-07, "5": 1.230639128329334e-07}, "score": 1.0018408875153408}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6676607858741692, "2": 0.3308061912553614, "3": 0.0014966833783844394, "4": 2.8569238383137652e-05, "5": 7.705123968223141e-06}, "score": 1.3339161079710196}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9307995286001829, "4": 0.06890117826639262, "3": 0.0002951228050332685, "2": 2.921968572994716e-06, "1": 4.892535376181971e-07}, "score": 4.9304978004441145}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7678950183767451, "2": 0.23183921184033957, "3": 0.0002637148901367263, "4": 1.3466534083398253e-06, "5": 7.086961242225715e-07}, "score": 1.2323735162591976}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6908813829052702, "2": 0.30737422493824895, "3": 0.0016875238533482675, "4": 3.696786633860437e-05, "5": 1.962895079817835e-05}, "score": 1.3109387764626774}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9833117556145231, "4": 0.016677429510703983, "3": 9.738621306203789e-06, "1": 0, "2": 0}, "score": 4.983303075276561}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.48761315629594676, "3": 0.3720179400243172, "2": 0.13752135016527323, "5": 0.0014725501283439797, "1": 0.0013749783409830413}, "score": 3.3502869584783794}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6162237443808848, "4": 0.27913356056615973, "2": 0.10441566154352179, "5": 0.0002204358136525219, "1": 6.5570877114957034e-06}, "score": 3.1751456635868474}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7007126432685429, "4": 0.2954050540078211, "3": 0.0038811180874131134, "2": 6.631875539255037e-07, "1": 0}, "score": 4.696830562167391}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9961818168689965, "5": 0.0037171129526744977, "4": 0.00010078651409677358, "2": 1.985821437503798e-07, "1": 0}, "score": 3.00753481447838}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9254602385685672, "4": 0.07452536065849928, "3": 4.3732290572997025e-07, "1": 0, "2": 0}, "score": 4.925472724037795}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6937841429981841, "2": 0.2256369020089696, "5": 0.03872588652914967, "4": 0.025641547341964884, "3": 0.01620990182012942}, "score": 1.4898856870644}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8280868075963547, "1": 0.16401944354240638, "3": 0.007604338038436259, "4": 0.00027739030506259446, "5": 1.2025345627185691e-05}, "score": 1.8441757518953383}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8218660363645368, "3": 0.12228581846043382, "1": 0.02947431125271492, "4": 0.02558536424920407, "5": 0.0007883786998371506}, "score": 2.146347385119339}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8847770735488402, "5": 0.06803474829405094, "3": 0.03719359908931045, "2": 0.009859478522014974, "1": 0.00013456422010186007}, "score": 4.010718505249016}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9056361808312178, "3": 0.08237325252842136, "4": 0.008757749617639619, "1": 0.0030710891755292326, "5": 0.00016149522214187846}, "score": 2.097302170889519}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4201397226718127, "3": 0.365119821934096, "4": 0.17360374576523263, "1": 0.039806542331987466, "5": 0.0013300368903870787}, "score": 2.676510970025152}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6179608580617162, "2": 0.3808904035349173, "3": 0.0011350102468816094, "4": 1.1940303876864634e-05, "5": 1.7469694746078715e-06}, "score": 1.3832032484847592}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.5984572051795511, "2": 0.39589420599445174, "3": 0.003106499964152624, "4": 0.0022723653172627076, "5": 0.0002695957346722238}, "score": 1.410002737215647}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9910773522059741, "3": 0.008755549071670891, "5": 0.0001661135445696222, "2": 7.423581710026384e-07, "1": 0}, "score": 3.991409077670512}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9295000202822835, "4": 0.066015309614441, "3": 0.004318434183296478, "2": 0.00015771688489592194, "1": 6.482651170639112e-06}, "score": 4.924848587722468}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.9244778567844447, "4": 0.06861763550202551, "2": 0.006011373624866041, "5": 0.0008918389419846967, "1": 6.421197655204203e-07}, "score": 3.0643886975691506}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7629893926170636, "5": 0.12320401982072957, "3": 0.10592446851941663, "2": 0.007513744767508238, "1": 0.0003665951325223222}, "score": 4.001152278418797}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9728689474741045, "4": 0.027054876842874956, "3": 7.402046122052056e-05, "2": 1.4518513831537674e-06, "1": 0}, "score": 4.97279270754373}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6989635108795141, "4": 0.29590278726565783, "3": 0.004534500249745082, "2": 0.0004580088733092958, "1": 0.00013798107774478312}, "score": 4.693101275651421}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5475219099054706, "4": 0.44831202707336854, "3": 0.004121061925188769, "2": 4.161894856717071e-05, "1": 0}, "score": 4.543319447669607}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5085481386649073, "3": 0.44523339106549104, "4": 0.044518386293876305, "1": 0.0012818749091633012, "5": 0.00041772576722955634}, "score": 2.534241724244437}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5394730765380127, "1": 0.46013854502918167, "3": 0.0003860423806871986, "4": 2.085362201614459e-06, "5": 2.062421238200364e-07}, "score": 1.5402522663675078}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7192431862537074, "4": 0.26490381000571855, "3": 0.01579617589824933, "2": 5.4809775219512386e-05, "1": 9.38215659675724e-07}, "score": 4.703335335655719}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.727715240838492, "4": 0.27006292272645743, "3": 0.0021850119092320193, "2": 2.609971926039974e-05, "1": 5.870662902037569e-06}, "score": 4.72546393900821}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9997805140805595, "4": 0.000168450435967982, "5": 3.3150359392117255e-05, "2": 1.738455308093446e-05, "1": 0}, "score": 3.000217366710479}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9712898971473247, "2": 0.02868394845380283, "3": 2.4482940232395156e-05, "5": 7.732588347265079e-07, "4": 7.163449587812848e-07}, "score": 1.0287381616306566}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5357906888797238, "2": 0.40891314700530645, "3": 0.030769615058882583, "4": 0.021819255919641945, "5": 0.0027038516107188186}, "score": 1.5467274329013985}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8757158962482088, "5": 0.09175300871968499, "3": 0.029159477219589634, "2": 0.003360750388603248, "1": 1.0439707428421721e-05}, "score": 4.055840735484607}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9616636390640042, "4": 0.03818605050830675, "3": 9.34228122543412e-05, "2": 2.847702318163984e-05, "1": 2.0386553838430325e-05}, "score": 4.961459817334381}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4797192221915534, "5": 0.2640014984249091, "2": 0.1342431729694759, "1": 0.08146811192689497, "3": 0.040551398935090376}, "score": 3.71055461426421}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5279992424662058, "3": 0.21022237078769254, "2": 0.16785245995311618, "1": 0.08656866196316368, "5": 0.007356518412064515}, "score": 3.201722645980256}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.823615124588027, "3": 0.1748014361208701, "1": 0.001156347093391762, "4": 0.00042661354558711656, "5": 3.5913229736735335e-07}, "score": 2.1744994143716845}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9249978646119483, "1": 0.0697670809561976, "3": 0.0046120769130067185, "4": 0.0006124731213613342, "5": 1.0142246865282862e-05}, "score": 1.9361003457988282}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.958038078393549, "4": 0.030553281043464466, "5": 0.005352609928099904, "1": 0.00444027929605286, "3": 0.0016154178905831169}, "score": 2.0743395552541535}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9210860979315104, "1": 0.05944220399121749, "3": 0.013977603225105871, "4": 0.005435246528543747, "5": 5.856554521003405e-05}, "score": 1.9655815791938196}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9883285179067705, "3": 0.010905162260284934, "4": 0.0007544481523576935, "1": 9.281726344176682e-06, "5": 2.441911313727858e-06}, "score": 2.012412104410122}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9264245389595741, "3": 0.06808831271579363, "1": 0.004011652611476979, "4": 0.0014693727058224342, "5": 6.0612833886503275e-06}, "score": 2.067033593503705}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5748919896020847, "3": 0.24821623435263457, "2": 0.11842879323390583, "5": 0.043789706527796464, "1": 0.014672332522170949}, "score": 3.5146984301319453}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9043660481755386, "2": 0.06031547950403233, "4": 0.034832699241652214, "1": 0.00033126364137577615, "5": 0.00015346040071753938}, "score": 2.974161586150859}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3734186136602657, "4": 0.28540107708433743, "1": 0.2711162725820104, "2": 0.05286281591694585, "3": 0.01718173118569692}, "score": 3.43715146321827}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5477608841781056, "2": 0.4341128133784106, "3": 0.01698382259593333, "5": 0.0010258210116859316, "1": 0.00011610089040455}, "score": 3.1154675754668673}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9423036596830373, "4": 0.0443586078497841, "2": 0.012174410866168363, "3": 0.0011600843047454212, "1": 0}, "score": 4.916797721591795}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6642475518063273, "4": 0.29173048485787634, "2": 0.028825899723780076, "3": 0.015117428431156495, "1": 7.784421282153316e-05}, "score": 4.591245258945248}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7760301006917416, "2": 0.14317788081052163, "5": 0.04712616556712203, "3": 0.03202759833206031, "1": 0.00163790056585514}, "score": 3.7238290061428914}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8365068915798619, "5": 0.14506258630459468, "3": 0.017316993090728323, "2": 0.001112660816737576, "1": 3.485479592506049e-07}, "score": 4.125519291163883}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5281241448980301, "2": 0.4383968449992611, "4": 0.032605851919035436, "1": 0.0008352957535146703, "5": 3.781740921958053e-05}, "score": 2.5926140318902853}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.995513390737646, "3": 0.0024408090909274066, "4": 0.0018628149897437643, "1": 9.883922676227217e-05, "5": 8.416932620002917e-05}, "score": 2.0063201076745436}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5297272645893023, "4": 0.4617632108115914, "2": 0.005810390492289401, "5": 0.0026922053191309318, "1": 6.660946276142506e-06}, "score": 3.4613240326266905}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.8557833420146285, "1": 0.1382541390706012, "3": 0.0057901058849981575, "4": 0.00016985626135670884, "5": 2.4045422624133015e-06}, "score": 1.8678828728522154}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9820123954986048, "4": 0.01638698265302677, "5": 0.0009877120994486847, "3": 0.0006072977864324243, "1": 4.660529451867414e-06}, "score": 2.036339773436241}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3700721471703897, "3": 0.22386835517547168, "5": 0.2021278825423326, "2": 0.10616303504718512, "1": 0.09776672451197863}, "score": 3.472632305178035}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9899111879688294, "5": 0.009088433662472825, "4": 0.0008547450676322281, "3": 0.00014466280593114305, "1": 4.4611503150895965e-07}, "score": 2.0291190230830187}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9840975398290449, "1": 0.014459639404653196, "2": 0.0009594915972313944, "4": 0.0004392393838498289, "3": 3.163112353800993e-05}, "score": 4.938779703235802}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9999413983091462, "3": 3.352242299195387e-05, "4": 1.3012319440104453e-05, "5": 1.0306796767646126e-05, "1": 1.1596306601121011e-06}, "score": 2.000089307875146}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.999797314573467, "3": 0.0001786523177298903, "5": 1.896809880838514e-05, "2": 7.090923961036831e-07, "1": 0}, "score": 3.999838896894534}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9725917971383019, "4": 0.027366826794752483, "3": 4.07389875081088e-05, "1": 0, "2": 0}, "score": 4.97255167774347}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.769210342169297, "5": 0.21819079337248243, "3": 0.01243486075025205, "2": 0.0001629114102994347, "1": 5.796247068459123e-07}, "score": 4.205428476245137}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9849353613088838, "4": 0.014843206398389345, "2": 0.0001870486153057961, "3": 2.7800126136327733e-05, "1": 0}, "score": 4.984539945721361}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.49725258632732167, "3": 0.22828496133474832, "4": 0.21476907453786134, "1": 0.04971348274870118, "5": 0.009979572751960064}, "score": 2.63804855156032}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9063672299436237, "4": 0.09327047252971561, "3": 0.00034436479909449814, "2": 1.6253488423693836e-05, "1": 1.254564572206835e-06}, "score": 4.905986979223596}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.45532428482045934, "3": 0.41421231435760675, "5": 0.10597934100966772, "2": 0.02439801505980656, "1": 8.568198195767032e-05}, "score": 3.6427138209736882}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5031965146455306, "5": 0.23733078349424713, "4": 0.20469262813140351, "2": 0.02866611831861777, "3": 0.026108613498452934}, "score": 2.6442931473556035}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9873235941501188, "4": 0.012334580974842472, "3": 0.00015754743034279993, "1": 0.00011409330265164698, "2": 6.829110733073195e-05}, "score": 4.986689052433786}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9881665747699618, "4": 0.01181606302379421, "3": 1.600801537861833e-05, "2": 2.4297749768816964e-07, "1": 0}, "score": 4.988151178846387}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8876157088160809, "4": 0.11009340908869426, "3": 0.002234511596170661, "2": 5.457667305109916e-05, "1": 0}, "score": 4.885273631900668}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9109985485250611, "3": 0.07533965168275755, "1": 0.011961665312225837, "4": 0.0016620998601961378, "5": 3.8004841441428765e-05}, "score": 2.0668162026049224}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.36534721631575773, "2": 0.35859659970318325, "3": 0.24839923714559825, "5": 0.015502794205209752, "1": 0.012153573952266643}, "score": 3.0134490649011387}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9854276584694945, "2": 0.0144837173776059, "5": 5.072980247732987e-05, "4": 3.7366387036290835e-05, "1": 0}, "score": 2.985655101040804}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9387063490495798, "4": 0.05214668845161565, "3": 0.006622164491576567, "5": 0.0024299441632016448, "1": 9.451925382856424e-05}, "score": 2.118110894149332}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5314077827588153, "4": 0.22093509685185414, "1": 0.2190018065747257, "2": 0.018546768684649263, "3": 0.01009712044742705}, "score": 3.827209731143947}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6278088109675644, "1": 0.35621948756774563, "3": 0.01448228066410422, "4": 0.0014538205872821602, "5": 3.553547729814667e-05}, "score": 1.6612770187752448}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9909432903119394, "4": 0.009054870402568835, "1": 0, "2": 0, "3": 0}, "score": 4.990945112942908}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9999270948117124, "4": 7.149393049852727e-05, "3": 8.372609892061808e-07, "2": 6.419329955496315e-08, "1": 0}, "score": 4.999926638930225}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963002488073517, "4": 0.002073485025813167, "1": 0.0016065520183616885, "3": 8.230843974426889e-06, "2": 5.983529181198804e-06}, "score": 4.991465847689327}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8153173377942567, "5": 0.10576917009398877, "4": 0.07504636173193577, "2": 0.0027744032498731703, "3": 0.0010917776932435018}, "score": 1.6531743443558178}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8104324944884723, "4": 0.18948422562668704, "3": 7.811253614337094e-05, "2": 3.6874145848393804e-06, "1": 0}, "score": 4.810348206385114}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9938302203412246, "4": 0.0049676842158921835, "1": 0.0011177304874411106, "3": 5.531474767995283e-05, "2": 2.770809359234896e-05}, "score": 4.990367627130462}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9999385375988907, "4": 5.3136525694577104e-05, "1": 6.8665826935931495e-06, "3": 6.405209546907336e-07, "2": 3.936502548160005e-07}, "score": 4.999916935115544}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9850711380966208, "4": 0.014898347175536666, "3": 1.5271167264075627e-05, "1": 8.17817939475407e-06, "2": 5.935015014991175e-06}, "score": 4.985020575795077}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999547484278832, "4": 4.305268326486666e-05, "1": 1.9271662331304353e-07, "3": 1.8367774512421837e-07, "2": 0}, "score": 4.999955809014215}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9223987178900613, "1": 0.04199752462229752, "3": 0.035011759087176283, "4": 0.0005889937415034232, "5": 2.6786034500213123e-06}, "score": 1.9942002558671974}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5336855879688571, "3": 0.44207143160316953, "4": 0.023427945899061258, "1": 0.0007887682551271052, "5": 2.610961292873112e-05}, "score": 2.4882169604694386}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8353896970077184, "3": 0.09489718847410582, "5": 0.04603726968467537, "2": 0.019094905638560592, "1": 0.0045677771173163}, "score": 3.89924561244443}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.44763966025583246, "3": 0.332953978917947, "4": 0.21410415002327024, "1": 0.0042788559779053615, "5": 0.001020705728750783}, "score": 2.7599475533470814}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8871671856925293, "3": 0.08218357618380764, "5": 0.0267656106541023, "2": 0.003543302773265329, "1": 0.0003373272603034648}, "score": 3.9364832567554813}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9291384593434027, "1": 0.07018265347364569, "3": 0.0006758424981299101, "4": 2.9537086727344007e-06, "5": 5.3382172234937495e-08}, "score": 1.9304992539755368}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3630896520014634, "4": 0.3305729228514886, "3": 0.2570687037619834, "1": 0.04642630789160855, "5": 0.0028420007085312297}, "score": 2.880314607079545}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.8409133469912106, "5": 0.14527428539707868, "4": 0.012265976348455982, "2": 0.0009142491780299952, "3": 0.0006302657513394355}, "score": 1.6200710147746482}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7066212859793498, "1": 0.17603222572405772, "5": 0.06173634262506024, "3": 0.03983094325680827, "2": 0.01577680114331973}, "score": 3.4622538286349354}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9818375716111445, "2": 0.017701445076408445, "3": 0.00043242355442046784, "4": 2.7356620296903306e-05, "5": 8.891187796078843e-07}, "score": 1.0186519243783165}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9837327493577049, "2": 0.016213241403869677, "3": 5.1953888105260884e-05, "4": 1.7024536907958033e-06, "5": 2.3513030196986934e-07}, "score": 1.0163231989846837}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9726158214249938, "4": 0.027104898797432827, "1": 0.00020839463337002774, "3": 6.386398311568754e-05, "2": 6.4735688618840065e-06}, "score": 4.971914358616791}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9391513092912538, "4": 0.04211436858358509, "3": 0.018671499661296866, "2": 4.78385145107832e-05, "1": 1.3582844436475048e-05}, "score": 4.920344673567074}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9934067589267415, "1": 0.005158323269845352, "4": 0.0014253994339687886, "3": 7.637662172322582e-06, "2": 1.4016464172254115e-06}, "score": 4.97792181664626}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997421506688544, "4": 0.0002328504863160893, "1": 2.378353555696826e-05, "3": 4.7199945784263524e-07, "2": 0}, "score": 4.999671071128044}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7964012318661778, "5": 0.1980328406841555, "3": 0.005532480559045309, "2": 3.313514686869751e-05, "1": 0}, "score": 4.192434149821517}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8957519552426129, "4": 0.10380005275639961, "3": 0.00044445755361486813, "2": 3.002605939053211e-06, "1": 0}, "score": 4.895301968635803}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9945296451821654, "2": 0.0050467873825650305, "4": 0.0003787444707223991, "5": 4.347819543097477e-05, "1": 1.177445849263427e-06}, "score": 2.995416557820404}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.999699260311249, "4": 0.0002713217966561652, "3": 2.2027938025719847e-05, "1": 3.912593909335443e-06, "5": 3.2767843419838673e-06}, "score": 2.0005705894049015}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8350036106574266, "4": 0.16484965537556606, "3": 0.00014361980399934938, "2": 2.3562822472693123e-06, "1": 0}, "score": 4.834855911010166}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5314092175617657, "4": 0.45035816075477597, "2": 0.011002423634982515, "3": 0.00690110317309292, "1": 0.000328053779870756}, "score": 4.501519627908929}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9488519441787041, "4": 0.051030540099594464, "3": 0.00010137571424298784, "1": 8.259012744767527e-06, "2": 7.4197291807669645e-06}, "score": 4.94871138957573}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9680029995516295, "1": 0.031877224171771, "4": 0.00010272366902080859, "2": 8.451234775437763e-06, "3": 7.771502813465823e-06}, "score": 4.872347376998861}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6310134003365102, "5": 0.3098227869375952, "2": 0.041621987736117715, "4": 0.017298646803302297, "3": 0.0002375688694246031}, "score": 2.333291692491078}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9952013657111325, "4": 0.0046356641502131885, "2": 8.236450322238142e-05, "1": 5.195575847889918e-05, "3": 2.4852356026407935e-05}, "score": 4.9948596950737345}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7378140137731598, "2": 0.26211301847719515, "3": 7.211914607751024e-05, "4": 4.75447201015526e-07, "5": 0}, "score": 1.262258780974487}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9032384375295565, "2": 0.09671420400285505, "3": 4.5480540718660864e-05, "4": 1.5535747377517568e-06, "5": 1.8737104277990602e-07}, "score": 1.0968105885538966}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8797027171542664, "4": 0.11623837959316004, "3": 0.004046749146743679, "2": 1.0601728543491874e-05, "1": 0}, "score": 4.875636123868065}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9997087938087562, "5": 0.00016433295086268473, "3": 0.00012598975044451346, "2": 5.001368879970143e-07, "1": 0}, "score": 4.000037342940957}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9095506614922271, "3": 0.07474610313825174, "4": 0.013900728919064001, "1": 0.0012248033236472655, "5": 0.000577384231845952}, "score": 2.1030549432119727}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5720348859723331, "3": 0.4138579955146906, "4": 0.014069153122019618, "5": 2.1184452880834663e-05, "1": 1.6590289560437218e-05}, "score": 2.44204334910272}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9781308817313803, "3": 0.019758839858507547, "4": 0.002079260452864056, "1": 1.8552407369493367e-05, "5": 1.2467927636675895e-05}, "score": 2.0239362120828615}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.75623746876687, "2": 0.24230069083696973, "3": 0.0014269371284606285, "4": 3.0682871213696985e-05, "5": 4.024857707067582e-06}, "score": 1.245262761096741}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6458564845629645, "4": 0.2629391085596259, "3": 0.0839377018446382, "5": 0.004741187723906124, "1": 0.00252513942489263}, "score": 2.6215145775711135}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8108472097213656, "5": 0.09615977000432929, "3": 0.07478082328994438, "2": 0.018175653504097895, "1": 3.2951130106048754e-05}, "score": 3.9849287321745996}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5109668825389823, "4": 0.31265297799568736, "2": 0.1680541382504439, "5": 0.00722580523487567, "1": 0.0010983579359414048}, "score": 3.156854022647718}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9886193610400161, "2": 0.011363310396473088, "3": 1.63793199089735e-05, "4": 7.203021933536427e-07, "5": 1.2106648251077252e-07}, "score": 1.0113987154384367}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6054885052904417, "3": 0.3747435850841918, "5": 0.016605239514795058, "2": 0.0031565645831449778, "1": 5.595571928870862e-06}, "score": 3.635531552685838}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9692087471080131, "5": 0.023555084016833608, "3": 0.007223327931018647, "2": 3.5236083287811145e-06, "1": 0}, "score": 4.016324860973369}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.7402521037938126, "4": 0.15451317673041526, "2": 0.10489638768172799, "5": 0.00020965987146584773, "1": 0.00012851691860499983}, "score": 3.0497790826703643}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8457582472202163, "3": 0.15146960518535652, "4": 0.0014000891021405985, "1": 0.0013690420736797194, "5": 2.9377898823784602e-06}, "score": 2.152909566708689}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8887638449350771, "4": 0.11107455905091557, "3": 0.00015093051388627288, "2": 4.397290509561902e-06, "1": 3.0761153716065836e-06}, "score": 4.888597727981746}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.997346418288766, "4": 0.0021165201026194435, "1": 0.0004839496430236944, "3": 4.195482977390055e-05, "2": 8.605896070680492e-06}, "score": 4.995837943359122}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8727406904227771, "4": 0.11888945109941519, "2": 0.007549099457406445, "3": 0.00044251464412326983, "1": 0.00037742661708483}, "score": 4.856068397070389}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8229416746619026, "5": 0.16755850585793916, "4": 0.005751325091654762, "2": 0.003535672702503542, "3": 0.00020842693704166987}, "score": 1.69144356400419}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8461484770397135, "3": 0.10129887230707257, "2": 0.03905724845794193, "5": 0.013489639940011003, "1": 5.708530060069868e-06}, "score": 3.834059136211668}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8408417883102467, "4": 0.15851952613051606, "3": 0.000569142907406767, "2": 6.917354957395573e-05, "1": 1.7212773334907554e-07}, "score": 4.8401339474054765}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9881823989021065, "1": 0.0076424702264010266, "4": 0.003874020199078326, "2": 0.00025315211622851155, "3": 4.6870784892982026e-05}, "score": 4.964702862581632}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9918961546394782, "1": 0.006160603718432277, "4": 0.0017398367360749096, "2": 0.0001394511775055401, "3": 6.322820972440706e-05}, "score": 4.973072918902127}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7418403801858026, "5": 0.21932774837170832, "3": 0.031233926097834864, "2": 0.00758888956992804, "1": 8.764965287084524e-06}, "score": 4.172889798516142}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6821963222680704, "2": 0.2281726499417602, "4": 0.08913344055922942, "5": 0.0003459757057386125, "1": 0.00015164838096741413}, "score": 2.8613494503770838}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5463433034101771, "3": 0.4102425249077491, "2": 0.040003725168178225, "5": 0.003393444828316232, "1": 1.6822647733891225e-05}, "score": 3.5130929144662133}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9904201860946193, "4": 0.009562558138546168, "3": 1.6898089327011825e-05, "1": 0, "2": 0}, "score": 4.990403642250398}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6531368764212694, "3": 0.19469325699456275, "2": 0.12248504966454629, "5": 0.023780841534859647, "1": 0.005903576058923565}, "score": 3.5664065838893793}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8435877091560104, "2": 0.14418217136797284, "4": 0.012029572329018575, "5": 0.00019999463835511686, "1": 3.223364374702485e-07}, "score": 2.8682467152389366}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9705851645030777, "1": 0.025292567528136994, "3": 0.0041086449528734675, "4": 1.3044095222032812e-05, "5": 4.3189039334639733e-07}, "score": 1.978843458175708}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9377371623092606, "2": 0.06193428967007035, "3": 0.0003134558616463816, "4": 1.2204802941117516e-05, "5": 2.938903515764074e-06}, "score": 1.0626095681888872}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8282011908453452, "5": 0.1300335870465114, "3": 0.04155362155945332, "2": 0.0002108488567262637, "1": 0}, "score": 4.088058333966348}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9601391664256025, "4": 0.024391909000842257, "5": 0.00694754443876718, "3": 0.006740125729523068, "1": 0.001781036643872451}, "score": 2.0745855566454914}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9968503055278941, "4": 0.0031467084782552477, "3": 1.218227042566485e-06, "1": 0, "2": 0}, "score": 4.996850849500695}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7151205994156515, "5": 0.1677536071888983, "3": 0.11271921224682649, "2": 0.004405531801910354, "1": 6.822586491822941e-07}, "score": 4.0462213015295925}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6388541486701091, "3": 0.3206544870110207, "4": 0.04016325725260799, "5": 0.00017743698964276804, "1": 0.0001505209922670905}, "score": 2.401362851329819}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9821128781833934, "4": 0.01786745102292936, "3": 1.4570290496017741e-05, "2": 4.580007144064436e-06, "1": 0}, "score": 4.982089659052385}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6765841830600788, "4": 0.30393372840768734, "2": 0.015484697512104172, "3": 0.003995075904777859, "1": 0}, "score": 4.641621197558178}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8791025600528187, "5": 0.0899564962963481, "3": 0.025081516463337485, "2": 0.005858703181318478, "1": 0}, "score": 4.053157611956813}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6031603121260573, "1": 0.39560444230974606, "3": 0.001210828188741, "4": 2.2899488131274264e-05, "5": 1.2497387856095673e-06}, "score": 1.6056558283288012}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.988994795756664, "2": 0.010971009337935333, "3": 3.268599039990774e-05, "4": 1.1462555173452166e-06, "5": 2.6857114124788667e-07}, "score": 1.0110408954086716}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9788845576950749, "4": 0.020524278017984236, "3": 0.000533761952622523, "2": 3.850270728699818e-05, "1": 1.8155645477968026e-05}, "score": 4.978220051169118}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7826367980955805, "5": 0.2035995305611958, "4": 0.0074368775676176505, "2": 0.005461033070890123, "3": 0.0008600474464051463}, "score": 1.8438947042997693}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9777824563109837, "5": 0.01203483401138105, "2": 0.008465609192075434, "4": 0.0011544237237462913, "3": 0.0005612053930097381}, "score": 1.0611907172289705}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9587366488287309, "3": 0.03703610616000686, "1": 0.0026728188885351343, "4": 0.0015469088958169066, "5": 7.373404633651028e-06}, "score": 2.037479230667355}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4396765966209791, "2": 0.42377912122241634, "4": 0.13057193213199053, "5": 0.003510695896655834, "1": 0.0024614016866159466}, "score": 2.70889132584179}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9645055426466885, "3": 0.03288844166863084, "4": 0.0025782244877445683, "5": 2.699985668329888e-05, "1": 7.311274808452912e-07}, "score": 2.0381251613823106}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8571379284375347, "5": 0.07930583275656584, "3": 0.05537738397922288, "2": 0.00814880816374845, "1": 2.930615487524703e-05}, "score": 4.007542919570813}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9759115252857605, "3": 0.022959777461984982, "2": 0.001124054096623714, "5": 3.246412556693233e-06, "1": 1.2070478172767523e-06}, "score": 3.9747917348319843}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8535111610770874, "3": 0.144050607525184, "4": 0.0023425354747412105, "5": 9.328893995095079e-05, "1": 1.5004477415950493e-06}, "score": 2.1490141799333915}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5593169902006205, "5": 0.381092367063535, "1": 0.053699467162638535, "3": 0.004809814793863804, "2": 0.001072754113030764}, "score": 4.213040476123983}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993775864197441, "4": 0.0005889277778984059, "1": 2.5630128601110606e-05, "3": 4.610602570783283e-06, "2": 0}, "score": 4.999299328228826}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9913868089116187, "5": 0.0073577507321024565, "4": 0.001115876259226311, "2": 0.0001168396588796607, "3": 2.1316353710614547e-05}, "score": 1.0329381504520878}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9997573939136172, "5": 0.00012331567831970803, "4": 0.00011229884289145336, "3": 4.061951641390159e-06, "2": 2.397037399513092e-06}, "score": 1.000840680630362}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.859384700789065, "1": 0.11887800259652857, "3": 0.021550251326883332, "4": 0.00018530359942685822, "5": 1.6746740644668824e-06}, "score": 1.9030478734542493}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6377328906471341, "3": 0.23551716045648927, "1": 0.08094049693544121, "4": 0.04406042463505206, "5": 0.001748841692836838}, "score": 2.2479440838962783}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9289408108069841, "3": 0.032366096770841665, "1": 0.030627885320751728, "4": 0.007906034107408599, "5": 0.00015915547552837708}, "score": 2.0180277464073106}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9951390293446669, "5": 0.002402283825856516, "4": 0.0019568201415074366, "3": 0.0004994005893515771, "1": 2.3771601429007564e-06}, "score": 2.011617516223037}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7067560656431919, "3": 0.21065486408201248, "4": 0.08137423332525737, "5": 0.000743428472840427, "1": 0.0004712279550646114}, "score": 2.375162455920923}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.687430235655892, "1": 0.26967433895204995, "3": 0.03928401837260506, "4": 0.003416954574187922, "5": 0.0001942621543534205}, "score": 1.7770263326021285}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.9738383229328785, "2": 0.023254758528451505, "4": 0.0028752452615677044, "1": 2.1780641222645932e-05, "5": 9.717151869219239e-06}, "score": 2.9795963561738965}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9390909651234821, "4": 0.05503659232354558, "5": 0.004279414832988521, "3": 0.0015890848412432675, "1": 3.6651547491899744e-06}, "score": 2.1244968834083218}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9841287086599134, "4": 0.014450508134856484, "3": 0.0013828799971788506, "5": 3.769715238188953e-05, "1": 2.028654267801536e-07}, "score": 2.0303967849555837}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9142092216591533, "4": 0.07095705812898247, "3": 0.014543447942737453, "5": 0.0002896144506628283, "1": 4.0418424943194563e-07}, "score": 2.1573260432717087}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7828069540035447, "3": 0.16721818872628452, "5": 0.030179647669945284, "2": 0.019614501772001677, "1": 0.0001805716330348816}, "score": 3.8231907164199797}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9669502293352616, "4": 0.030027354383061672, "1": 0.0024978240652581752, "3": 0.00043318334067751546, "2": 9.11364248419183e-05}, "score": 4.958841562186372}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9279151440296646, "4": 0.07179496002712515, "3": 0.00015826337220570036, "1": 0.00011124851336705204, "2": 1.938942002875524e-05}, "score": 4.9273852786895755}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.42633557844102005, "4": 0.3333077305393415, "5": 0.14665295994875105, "3": 0.07990860778780551, "1": 0.013793907083557018}, "score": 3.172690467854774}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9773087768162898, "4": 0.022577668063907774, "2": 6.118380669161952e-05, "3": 5.183966334799914e-05, "1": 0}, "score": 4.9771350890331965}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"1": 0.885857550074756, "2": 0.11410136032132857, "3": 4.068752595844963e-05, "4": 2.552728152394895e-07, "5": 7.841739964236223e-08}, "score": 1.1141838226700636}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9186060233630297, "2": 0.08135429094470793, "3": 3.933766897749526e-05, "4": 1.1415507567508616e-07, "5": 0}, "score": 1.0814333277925565}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7830585494411456, "5": 0.20170609829441907, "3": 0.012034978430255697, "2": 0.002237054351872938, "1": 0.000961561531176185}, "score": 4.182312647063613}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9892127690072724, "4": 0.01069299419592263, "3": 9.149154448068751e-05, "2": 2.0351928031397226e-06, "1": 0}, "score": 4.989117909409774}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7567308401500782, "2": 0.12403723204726011, "3": 0.11700860498599204, "5": 0.002219787074689177, "1": 2.920630617803411e-06}, "score": 3.6371277328954683}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5045038035349226, "1": 0.36313656621509494, "3": 0.10965049387767725, "4": 0.02209914630362036, "5": 0.000598094972340953}, "score": 1.7925040370023753}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8793320181796299, "5": 0.08611617691543284, "2": 0.02701307691615156, "3": 0.0075227839756733346, "1": 1.2913723175363673e-05}, "score": 4.0245285722666155}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7344492576217768, "3": 0.2447927120070912, "2": 0.01073709726187862, "5": 0.009968850475507876, "1": 5.108120176307745e-05}, "score": 3.743548443520579}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9944834294688776, "4": 0.005500881097658612, "3": 1.2372194280791446e-05, "1": 0, "2": 0}, "score": 4.994474356183898}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9960809237032434, "5": 0.0036435212083430466, "3": 0.0002719438355331859, "2": 5.210983715813252e-07, "1": 0}, "score": 4.003370545591573}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8144416927977641, "5": 0.16660902150920093, "3": 0.018521488137416144, "2": 0.00042649594444466043, "1": 9.822548901515003e-07}, "score": 4.147231641737575}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7904871167989118, "4": 0.19032217213216382, "1": 0.015658333683308327, "3": 0.002389727347715866, "2": 0.0011417067352301176}, "score": 4.738839671880246}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8413043280161956, "4": 0.15291103458676117, "2": 0.004762788323473126, "3": 0.00102119884869665, "1": 0}, "score": 4.830758092700129}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999747739361825, "4": 2.466685791863739e-05, "1": 0, "2": 0, "3": 0}, "score": 4.999975333128288}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9956811883061859, "4": 0.004309191411532663, "3": 4.298712494429333e-06, "1": 0, "2": 0}, "score": 4.995682188185941}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"1": 0.713234186630043, "2": 0.27823672468266186, "3": 0.007655848602806798, "4": 0.0008483078138550285, "5": 2.4631018368890422e-05}, "score": 1.2961919586318145}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8461293627615137, "1": 0.15299630625581245, "3": 0.0008700003012946628, "4": 4.211873488972969e-06, "5": 5.679804107103728e-08}, "score": 1.8478822787537863}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5748416715084383, "5": 0.3995627718844699, "3": 0.02409186854960417, "2": 0.0012901054754968489, "1": 0.00021329635953053745}, "score": 4.372250909851854}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5905126033795559, "2": 0.20004188687248298, "5": 0.15968880921676748, "3": 0.04428185409297075, "1": 0.005473961508957945}, "score": 3.6989010304006666}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7072179755966829, "4": 0.29048425610813683, "3": 0.0020136475500001066, "2": 0.00015474035108115885, "1": 0.00012904208067674472}, "score": 4.70450795944699}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8429549942577943, "3": 0.10061672325428189, "4": 0.029700241556234762, "1": 0.02434093689926105, "5": 0.002386953529442289}, "score": 2.142837151553235}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8381784782265984, "4": 0.13929466466093254, "3": 0.012179582436568465, "1": 0.008363571752549112, "2": 0.0019826835968333864}, "score": 4.796943625684488}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.985289692489414, "4": 0.014182825758230188, "3": 0.0005246616391537631, "2": 2.011346821169734e-06, "1": 0}, "score": 4.9847618045988575}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9700222079043855, "4": 0.029221767064542038, "5": 0.0005432869090219308, "3": 0.00021251329645593085, "1": 2.2658560871768948e-07}, "score": 2.060285681460894}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.48448275096911747, "2": 0.4242903798592081, "4": 0.08583100277937773, "5": 0.005393113591943932, "1": 6.35655555319411e-07}, "score": 2.672324885057282}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8872229281579376, "1": 0.07957639303734058, "3": 0.02817048726334802, "4": 0.0049904290048417045, "5": 3.9706009854609034e-05}, "score": 1.9586940679303675}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9939336073170063, "2": 0.0060652858901327315, "3": 1.0824971606817451e-06, "4": 1.1247499496260715e-08, "5": 0}, "score": 1.0060674847061222}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9932024614984085, "4": 0.006744067833398881, "1": 2.498389851478579e-05, "3": 1.9599882238218688e-05, "2": 0}, "score": 4.99311673563727}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6659919337510516, "3": 0.22736641496953525, "2": 0.07527712313228534, "1": 0.02313758332019686, "5": 0.008224333656663174}, "score": 3.560889775870405}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8294383035467232, "4": 0.16020128870971348, "3": 0.008723373034257468, "2": 0.0016355322376350508, "1": 0}, "score": 4.817445094225292}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8328690100673571, "2": 0.1669411706807954, "3": 0.00018243930784598712, "4": 4.584580272805887e-06, "5": 2.024072473732558e-06}, "score": 1.1673280283858456}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.533337823710836, "2": 0.26983327789137396, "4": 0.19407247639909564, "1": 0.0013788638720751447, "5": 0.0013766985515683275}, "score": 2.9242348027408345}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6815400719098016, "4": 0.3143819283128752, "3": 0.004067289792440051, "2": 9.353014062301316e-07, "1": 0}, "score": 4.677477533643003}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8210067975220311, "5": 0.17328041513249753, "3": 0.005706773364849282, "2": 2.9411114612841855e-06, "1": 0}, "score": 4.16756827446011}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6218257003691953, "4": 0.22857719317202282, "3": 0.1400674481343045, "5": 0.009329504255437542, "1": 0.0001999390475731309}, "score": 2.6250105425877734}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9936794179483333, "2": 0.0063169044059765405, "3": 3.6449004655348373e-06, "4": 2.748850279158016e-08, "5": 9.939550883949059e-09}, "score": 1.0063243164010038}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5702459043752168, "2": 0.4295682519234751, "3": 0.0001853847801806946, "4": 1.8435142176176698e-07, "5": 0}, "score": 1.4299396925865164}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7303997441419315, "2": 0.15998273113171485, "4": 0.10583838692342055, "5": 0.003334533464849508, "1": 0.00044389225229218404}, "score": 2.9516369037781467}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6440323314648521, "3": 0.3310404849689579, "5": 0.017844598885312184, "2": 0.007078257623070981, "1": 0}, "score": 3.672646182191319}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7638578708811155, "3": 0.18357431630270543, "4": 0.033587254981442424, "5": 0.010647363246165355, "1": 0.00833284453751956}, "score": 2.274358167505932}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7564666207441167, "1": 0.24111810579378518, "3": 0.0023896317605337134, "4": 2.3215811064838623e-05, "5": 2.3008866714332306e-06}, "score": 1.7613248304135827}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9465712593032778, "4": 0.05270671037219979, "3": 0.0007145668521719805, "2": 6.180236615066641e-06, "1": 0}, "score": 4.9458455457206805}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.6997437656657274, "3": 0.19902795236023935, "4": 0.0774554148829174, "1": 0.017336988435850142, "5": 0.006435770559737287}, "score": 2.355909143841623}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6635119200238245, "4": 0.23075143194645278, "3": 0.0963367416224343, "5": 0.008860438708136294, "1": 0.0005391547082213607}, "score": 2.583881949681282}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9257761335400377, "1": 0.06669994170826475, "3": 0.006920946785482786, "4": 0.0005801478344031352, "5": 2.2537454236184146e-05}, "score": 1.9414488959721372}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9968959201487215, "5": 0.002570866184728073, "4": 0.00045379259659408133, "2": 6.381616690174137e-05, "3": 1.394396165051868e-05}, "score": 1.0117365661126458}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8122480135905742, "3": 0.1701369802858465, "1": 0.012637085429006843, "4": 0.004971127517079307, "5": 6.05668462001181e-06}, "score": 2.1674604432782814}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8972314396375746, "5": 0.09363956329771507, "3": 0.009054723714856494, "2": 7.118723779961273e-05, "1": 2.738536238050699e-06}, "score": 4.084434278845858}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8225782122351956, "5": 0.17520450278193062, "3": 0.0020266380334578705, "2": 9.592384140866029e-05, "1": 9.292758723351198e-05}, "score": 4.172707544403938}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9074424189944804, "2": 0.08121142822747651, "4": 0.011297128506787183, "1": 4.790948770442644e-05, "5": 6.723599499637894e-07}, "score": 2.929991195050254}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9881804185865634, "2": 0.011809197523272492, "3": 9.728780535411057e-06, "4": 2.8554762761349345e-07, "5": 1.851597261084462e-07}, "score": 1.0118302545476565}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6189836253747635, "4": 0.33910129870480643, "2": 0.039885824256732434, "5": 0.002012731750044105, "1": 1.6347771003107022e-05}, "score": 3.303208294601235}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.707520574020446, "4": 0.2683018570584417, "2": 0.019576729275214123, "5": 0.00459533003933886, "1": 5.427000341266085e-06}, "score": 3.2579049551657757}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6223734652374593, "4": 0.2552754552937162, "2": 0.11677645649624344, "5": 0.005225502570579364, "1": 0.00034778342982687234}, "score": 3.1482546352912997}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.596117043193442, "4": 0.37866073238895154, "3": 0.025215862959145338, "2": 2.8059034087154428e-06, "1": 0}, "score": 4.570897598285319}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.47575471128322394, "2": 0.3592870240654704, "3": 0.14746290888667732, "5": 0.0174930538448315, "1": 1.920448126383224e-06}, "score": 3.151450011785053}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9232439760437205, "4": 0.054402171969898855, "5": 0.012501966838145383, "3": 0.009851180335126383, "1": 6.39757908578574e-07}, "score": 2.1561607951905235}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6420509930626196, "4": 0.3070656839639271, "3": 0.04397143326021973, "2": 0.006909707306908789, "1": 1.4416676848420068e-06}, "score": 4.58425625296671}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.48091658205379706, "2": 0.33737210116633776, "5": 0.18065186456845278, "3": 0.0010590228877396053, "1": 0}, "score": 3.5048484267677456}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5093390368411128, "5": 0.2710843369661449, "2": 0.20636151935290295, "3": 0.013210124973107949, "1": 4.827016418035048e-06}, "score": 3.845136668257342}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9271307101113093, "1": 0.03742445167823279, "3": 0.03498577600334408, "4": 0.0004533635117868168, "5": 5.507614327358157e-06}, "score": 1.9984845739020975}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9985623494111412, "3": 0.0013348237744507253, "4": 9.905205875778802e-05, "1": 2.524372603432046e-06, "5": 1.0517511721505564e-06}, "score": 2.001533559077493}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4684125754247235, "3": 0.36393692839467895, "2": 0.12813556166237575, "5": 0.03579597578979615, "1": 0.0037188622658123746}, "score": 3.404431279822813}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9803798131131787, "4": 0.01757240157519567, "3": 0.0012768774163508167, "2": 0.0007702872967834516, "1": 0}, "score": 4.977562967777364}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.932517668677723, "5": 0.0632006179618345, "4": 0.004089083161290544, "3": 0.00013246594028963442, "1": 5.907622492640301e-05}, "score": 2.1978536251949063}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8710557040860899, "3": 0.101715935190137, "4": 0.015993797310480926, "1": 0.010989974839155817, "5": 0.000244560704427162}, "score": 2.1234472405256635}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7971660803746303, "2": 0.19010529045923702, "4": 0.008830770577975662, "5": 0.0038939235694432006, "1": 3.70670580115546e-06}, "score": 2.8265058742350733}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9629990198437018, "5": 0.03628893155673603, "2": 0.0004151314669786111, "4": 0.0002959142031142065, "1": 1.874068340670363e-07}, "score": 3.072458330127348}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9770008821721474, "2": 0.02267592930813552, "4": 0.00022164224167056646, "1": 5.5003320600485065e-05, "5": 4.6509730927790087e-05}, "score": 2.9775287250075477}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7664008218306932, "2": 0.21532680105191543, "4": 0.008866080172579617, "3": 0.00858206258371488, "5": 0.0008240577051376226}, "score": 1.262385443909587}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9151151267836652, "3": 0.08203223493512748, "1": 0.0023509377214812064, "4": 0.000500820552341448, "5": 8.612276203809926e-07}, "score": 2.0806855235164456}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9010929622032297, "3": 0.055203418404432075, "5": 0.04206292363784892, "2": 0.0016362569389258069, "1": 0}, "score": 3.9835869185009236}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9838937041526827, "4": 0.016077401926829746, "3": 2.83551184248561e-05, "1": 0, "2": 0}, "score": 4.983865879143224}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8108356146891713, "5": 0.18691647867531044, "3": 0.002242854262319858, "2": 4.561979170421235e-06, "1": 0}, "score": 4.184664591013063}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.987713035817842, "4": 0.012259776238334116, "3": 2.2728293497931755e-05, "1": 2.2476125364922905e-06, "2": 0}, "score": 4.987685749484936}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8326726010737738, "2": 0.16223024294931307, "3": 0.004370741083183085, "4": 0.000700392265912527, "5": 2.599005742005307e-05}, "score": 1.1731768677835364}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9896136218426103, "1": 0.008474619698972839, "4": 0.0018804159060216803, "3": 1.7202084321572096e-05, "2": 9.340255038939697e-06}, "score": 4.964158508317532}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9996986644806704, "4": 0.0002529891387500413, "1": 4.4415635482934145e-05, "3": 2.06159315056856e-06, "2": 0}, "score": 4.999565224320355}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9104263615690641, "1": 0.0889810992304951, "4": 0.0005569225367336, "3": 2.196718080523888e-05, "2": 1.2089297510861098e-05}, "score": 4.643437921984197}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9241868769577567, "1": 0.0617369414704881, "4": 0.0138703376644805, "3": 0.0001292471622925654, "2": 7.395501906862921e-05}, "score": 4.7387008467910325}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"4": 0.821625018403083, "2": 0.12335998386045668, "3": 0.03335276171513638, "5": 0.02055795722689304, "1": 0.001100329058303674}, "score": 3.737183202558933}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8035864402012391, "1": 0.1946605318086909, "3": 0.0012480973590729507, "4": 0.0004965630964877385, "5": 0}, "score": 1.8075790816546828}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9994802263291609, "3": 0.0005160492764738079, "1": 2.213866552244622e-06, "5": 9.400601259042769e-07, "4": 4.249930589660279e-07}, "score": 2.0005175056517013}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9961670317478086, "3": 0.0021234651923212294, "4": 0.0015729019342241243, "5": 0.00010999650119454936, "1": 2.6521389489387356e-05}, "score": 2.0055727376387105}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9297603353229709, "1": 0.06917260335667838, "3": 0.0010542285624001338, "4": 9.212392218515249e-06, "5": 2.31507493874926e-06}, "score": 1.9319069063336867}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9986200048702015, "2": 0.0013794147002987242, "3": 4.989320114883737e-07, "4": 2.892180581122363e-08, "5": 0}, "score": 1.0013804994023199}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9996088453709269, "4": 0.000217043014622671, "3": 0.00014840285334851032, "5": 2.478849310922773e-05, "1": 7.817420579360077e-07}, "score": 2.0006560727107465}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9618740327283993, "4": 0.037978221574890884, "3": 9.354452797563657e-05, "2": 5.2136618802425394e-05, "1": 1.4234031059778262e-06}, "score": 4.961672561326813}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9985491514997876, "4": 0.0010951243067617241, "3": 0.00029103558879674604, "5": 5.852731439273226e-05, "1": 6.012180880195134e-06}, "score": 2.0026508543598855}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8542752759115989, "3": 0.09434018878641777, "5": 0.03756002346156366, "2": 0.013822065700447533, "1": 2.207287879305854e-06}, "score": 3.9155690612441068}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7450120918970494, "2": 0.2547202486899104, "3": 0.0002627115226090558, "4": 3.849774433816699e-06, "5": 9.970608856426524e-07}, "score": 1.2552612350974253}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8053878792760817, "3": 0.08895699751543827, "2": 0.05952173137015984, "5": 0.026987029966616703, "1": 0.019146089267628508}, "score": 3.76154823690505}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9685414779999961, "4": 0.02715597997361793, "1": 0.003828028347943353, "3": 0.00042491037229400424, "2": 4.484111920962006e-05}, "score": 4.956547355602776}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5634195241426483, "5": 0.43565182115361056, "4": 0.0007083827521261602, "2": 0.00011730701502011339, "3": 0.00010124978251296819}, "score": 2.745055232489472}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9590766656189399, "1": 0.03883756618936955, "4": 0.002017299385377137, "3": 3.649614205811862e-05, "2": 2.8802193803235195e-05}, "score": 4.842472537555454}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6056041404159024, "3": 0.3489292846813507, "2": 0.026707640325425712, "5": 0.018645968919150872, "1": 0.0001123615231319477}, "score": 3.6159640870080016}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8955550458213141, "3": 0.08538338945283139, "5": 0.01204660983648404, "2": 0.00684559431035332, "1": 0.0001691797159619748}, "score": 3.912464476783118}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7514014996773771, "4": 0.24651597014291143, "3": 0.0020551591269353476, "2": 2.3860265832767737e-05, "1": 0}, "score": 4.749301250655824}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7395341633458465, "4": 0.2581452933634267, "3": 0.0017935112291241919, "1": 0.0004131868276909674, "2": 0.00011101274982055215}, "score": 4.736281151638656}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8666966050056701, "4": 0.1331159401560669, "3": 0.00016305418322026628, "2": 2.1956902569916695e-05, "1": 0}, "score": 4.8664917545086785}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5635544060168354, "3": 0.42564153673709326, "4": 0.010620523187734656, "1": 0.00016983282280993856, "5": 1.3676124263260949e-05}, "score": 2.446753789881094}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5306248524419768, "4": 0.30207462182310896, "2": 0.16520403388554616, "1": 0.0011168301829957066, "5": 0.00097947484733075}, "score": 3.136595902784949}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.89481144847208, "4": 0.10508357426922452, "3": 0.00010381417872302629, "2": 3.1526824155520306e-07, "1": 0}, "score": 4.8947077623006106}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9163669757409838, "3": 0.0608810693926918, "1": 0.01670190156289594, "4": 0.0060115539687799315, "5": 3.820962923127271e-05}, "score": 2.056316920970367}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9285059964481992, "3": 0.06965839881672711, "4": 0.001778927365443757, "1": 5.557783985024115e-05, "5": 1.1504423929976507e-06}, "score": 2.0731641233099674}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8758269790972143, "4": 0.12311831196884228, "3": 0.0010505801957929612, "2": 3.7231815493497777e-06, "1": 0}, "score": 4.874769307306789}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5730403189976702, "5": 0.4192132787791557, "3": 0.007627089204388528, "2": 0.00011765699365220877, "1": 1.5168799457267378e-06}, "score": 4.411346382184495}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.511482145683135, "4": 0.4739937940946929, "3": 0.00998019150465182, "1": 0.002987665397730277, "2": 0.0015560884661343268}, "score": 4.489426837265486}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9877369940758033, "4": 0.012129033957067806, "2": 7.620709418991417e-05, "3": 5.686002568602299e-05, "1": 5.827258507754371e-07}, "score": 4.987526289787538}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7116377109535322, "5": 0.26436601911742896, "3": 0.02074857311939987, "2": 0.002841011864353528, "1": 0.0004062905556543193}, "score": 4.236716643960949}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6469971302257245, "3": 0.22465897347884448, "4": 0.09621928246231146, "5": 0.02168966715092328, "1": 0.010434600748394812}, "score": 2.4717321022959218}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5067036616809188, "2": 0.4832861053880951, "3": 0.009302486955518026, "4": 0.0006035083388746168, "5": 0.00010425898645429762}, "score": 1.50411862949871}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9685744632102399, "4": 0.03027272914358381, "2": 0.0006147588997190055, "1": 0.0002845234165648292, "3": 0.0002526827016522689}, "score": 4.966239506640151}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975806595330304, "4": 0.0022808958420639895, "1": 0.00011511637324586995, "3": 1.5566070193900144e-05, "2": 7.115130393690613e-06}, "score": 4.997206159325627}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9621023962235967, "1": 0.03705945367013664, "4": 0.0007989435224423621, "2": 2.0292402561961547e-05, "3": 1.5842125420377753e-05}, "score": 4.850870222203479}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7517679498343668, "5": 0.17853057569899003, "3": 0.06840874579687065, "2": 0.0012857419940572922, "1": 6.4160557386009026e-06}, "score": 4.107531159106217}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9100671417956423, "5": 0.05984572967399471, "3": 0.02882832984955516, "2": 0.0012585726721530833, "1": 9.036308542619581e-08}, "score": 4.028499987256773}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9994907035354955, "4": 0.0004764184467952949, "3": 3.2029154237979405e-05, "1": 0, "2": 0}, "score": 4.999459522785938}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7788548337212858, "4": 0.19536452627398646, "3": 0.020190263413731056, "5": 0.005587088322816259, "1": 2.824511863436416e-06}, "score": 2.427677954756642}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8469722309927953, "4": 0.15063178953531053, "3": 0.00118572959722024, "1": 0.0011019859697023735, "2": 0.00010684397128695881}, "score": 4.842268051508673}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9991113271538098, "2": 0.0008867639791125592, "3": 1.876346543048875e-06, "4": 7.16477561486012e-08, "5": 0}, "score": 1.0008907315806153}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.728725733989096, "2": 0.26987162392458347, "3": 0.0013691735080275406, "4": 3.22346692448634e-05, "5": 8.836701300507492e-07}, "score": 1.2727103051426556}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.503471717600006, "4": 0.3033079963938387, "2": 0.18607058276891258, "5": 0.00541491876764483, "1": 0.001734377013661664}, "score": 3.1245985479013103}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9953572380942597, "5": 0.004631777848638777, "3": 6.824844507067753e-06, "2": 1.5086204907302283e-07, "1": 0}, "score": 4.004624669817331}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8143505211536834, "5": 0.10426449366553037, "4": 0.07807381138064748, "3": 0.002257967289165976, "2": 0.0010487332203260083}, "score": 1.6568470148703296}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5989352820655672, "3": 0.3356519899396082, "2": 0.0447445020959509, "5": 0.020555153312758583, "1": 0.00011284447665814932}, "score": 3.5950755333841737}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8577557531574729, "1": 0.13029532164311836, "4": 0.011741867566722797, "3": 0.0001384969852114705, "2": 6.720694281987009e-05}, "score": 4.466597508992486}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8010523085408413, "4": 0.19575965934808623, "3": 0.0018324672428956348, "2": 0.0008508803828191832, "1": 0.0005039270713829055}, "score": 4.796006902224909}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.721460824167883, "5": 0.27753267638200785, "4": 0.000898602840774024, "3": 5.685343030558286e-05, "2": 4.831874390592498e-05}, "score": 2.1129915719282013}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7884384935475872, "2": 0.2099924502712941, "3": 0.0014581737243359102, "4": 0.00010567956647513082, "5": 5.1307895615043046e-06}, "score": 1.21324637495286}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9453476051367226, "1": 0.03523432956195653, "3": 0.018869653165071158, "4": 0.0005342363040170176, "5": 1.4053683861556004e-05}, "score": 1.9847459553994768}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.864527806103099, "4": 0.13361924217428878, "3": 0.0018489567830462146, "2": 3.4909697326074505e-06, "1": 0}, "score": 4.862672302141404}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5455412270160854, "5": 0.45140603733422735, "3": 0.003025631950686482, "2": 2.6368564392967e-05, "1": 0}, "score": 4.448327997836182}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9920167398409256, "1": 0.005734102705580985, "3": 0.0022480052759513485, "4": 1.079753266362713e-06, "5": 0}, "score": 1.9965160618245816}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6992674443374627, "5": 0.28930129230600016, "3": 0.01141746589489515, "1": 0, "2": 0}, "score": 4.277887660555442}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.945294131171188, "1": 0.03439138094228588, "3": 0.019723031784838696, "4": 0.0005759796083875498, "5": 1.531263887978827e-05}, "score": 1.9865295457687737}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5516025004432128, "5": 0.44113849730224663, "3": 0.004062852361293178, "2": 0.0031870963876416357, "1": 8.836726988888127e-06}, "score": 4.430675035345841}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8893688278816686, "4": 0.11039019085916268, "3": 0.00024045730744438998, "2": 2.9138016891902633e-07, "1": 0}, "score": 4.889127994599768}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6097247824115335, "4": 0.37194034517545227, "5": 0.018274244771009193, "2": 6.023849248109485e-05, "1": 0}, "score": 3.408428755164845}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8790883714520018, "5": 0.11829059646989692, "3": 0.002588559851011294, "2": 3.188107450297469e-05, "1": 0}, "score": 4.115638342829786}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4165629701364974, "1": 0.3685745799155023, "5": 0.1170485000191538, "3": 0.078704298991488, "2": 0.019107569758690882}, "score": 2.8944030208189293}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5844880167447635, "4": 0.39136024518059265, "3": 0.018616470115451523, "1": 0.003477283129577339, "2": 0.0020547008775467467}, "score": 4.551332106033696}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9974258787465744, "1": 0.0025530386545579123, "4": 1.8214984107487682e-05, "3": 1.6487436241557465e-06, "2": 6.985116358841181e-07}, "score": 4.989764232049225}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7667653704151844, "5": 0.23277729452279472, "4": 0.0003970309978891018, "2": 2.4563351555734304e-05, "3": 2.109281704178077e-05}, "score": 1.9323806774852472}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8663567532464733, "5": 0.13283298390507986, "4": 0.0007905426101376688, "3": 1.1270036401173658e-05, "2": 4.786912147646685e-06}, "score": 1.5337328456537505}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6504743324461508, "1": 0.34920731756849777, "3": 0.0003161312760837509, "4": 2.0688451601808347e-06, "5": 0}, "score": 1.6511128991122521}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9994359249501822, "1": 0.0005294973487592669, "3": 3.41408822094134e-05, "4": 3.606618576444475e-07, "5": 0}, "score": 1.9995053648194956}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8767720943449387, "3": 0.09881378101478336, "1": 0.01824314291943359, "4": 0.006147641909752868, "5": 2.3357136239651332e-05}, "score": 2.092935991713444}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9982692010630246, "3": 0.0016054433981876899, "1": 0.00011452287193814962, "4": 1.0827157465086751e-05, "5": 2.0756694827881447e-08}, "score": 2.001512637088201}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8024467029122276, "2": 0.19687395054136303, "3": 0.0006703148705025705, "4": 7.64133677149773e-06, "5": 1.0730065392206854e-06}, "score": 1.1982418592274433}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6520857221548718, "3": 0.34100552482398516, "4": 0.006561310005515472, "1": 0.0003355037245915506, "5": 1.1856219212477946e-05}, "score": 2.353828239161219}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6935231627509052, "1": 0.3055149088769602, "3": 0.0009591702213797819, "4": 2.636527098022682e-06, "5": 9.191974293743087e-08}, "score": 1.6954498011115116}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9783095194128113, "3": 0.012394511813884353, "1": 0.009262650872162591, "4": 3.3033842225545586e-05, "5": 1.9098097904703265e-07}, "score": 2.00319850186682}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9558125715653119, "3": 0.036227227571825386, "4": 0.006242078869001874, "1": 0.001710080215360917, "5": 8.086027385272068e-06}, "score": 2.047025561095796}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.99751411863324, "3": 0.0024065935405985137, "1": 4.829396274721185e-05, "4": 3.101892673326416e-05, "5": 4.3970011157551215e-08}, "score": 2.002420469174258}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5461289821999356, "4": 0.4162423983818268, "3": 0.025253684831179155, "5": 0.012373304376454218, "1": 1.010222453876506e-06}, "score": 2.89485793930306}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7965507383729056, "2": 0.19426122598027346, "3": 0.007893626636377049, "4": 0.0011909047102454716, "5": 0.00010144731076784273}, "score": 1.214027422878982}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9979245818647222, "2": 0.0019265321610630619, "3": 9.389654189100873e-05, "4": 3.6470275464190495e-05, "5": 1.726994241856021e-05}, "score": 1.002292818705134}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9991688017368181, "5": 0.0003800173303878354, "4": 0.00034834524034816256, "2": 7.868437193186884e-05, "3": 2.1906503538477106e-05}, "score": 1.0026876084547935}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8213589782217546, "2": 0.17662590749759766, "3": 0.0019764776167139637, "4": 3.7319297718292896e-05, "5": 1.1481116599867423e-06}, "score": 1.1806954436543475}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"1": 0.999768477225535, "2": 0.0002313189647699656, "3": 1.1491696647787363e-07, "5": 1.2839570363898354e-08, "4": 0}, "score": 1.0002316001745983}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5900804827174798, "2": 0.19994239078546772, "4": 0.19349128621633765, "5": 0.01145337308258725, "1": 0.0050323409777788}, "score": 3.006390960447156}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9905231124416679, "4": 0.009464796450935594, "3": 1.0583884964733898e-05, "1": 3.546448396311909e-07, "2": 0}, "score": 4.990512606264819}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9034856335154143, "4": 0.0963282450965255, "3": 0.00018249039800447242, "2": 2.9364006363466793e-06, "1": 0}, "score": 4.9032978977373}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999531988512079, "4": 4.162100875611401e-05, "1": 4.486897836527395e-06, "3": 1.2124203500099385e-07, "2": 0}, "score": 4.999940188881616}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9290090068550108, "5": 0.07029197080419136, "4": 0.0005437146441110114, "2": 0.00011883542562387555, "3": 3.455044942070604e-05}, "score": 1.28298750732508}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9676886674238214, "3": 0.031229004018951845, "4": 0.0006719356372029014, "1": 0.0004026869890162275, "5": 7.634600083781279e-06}, "score": 2.0321930944009563}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.40187101502334055, "4": 0.3816394745196702, "5": 0.2161024668969954, "3": 0.0003855672235529687, "1": 7.511127975419368e-07}, "score": 3.411972189836698}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.998576135258673, "4": 0.0013114105045327893, "3": 8.28768323416083e-05, "5": 2.901879019616715e-05, "1": 4.759661969726496e-07}, "score": 2.0027922784765746}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.999934246531854, "4": 4.482004883551732e-05, "3": 1.6884390532179745e-05, "1": 2.13872436026263e-06, "5": 1.4807231124736744e-06}, "score": 2.0001088279799313}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7574863208844611, "4": 0.24150760879217684, "3": 0.000923292936030172, "2": 5.616771119889064e-05, "1": 2.3507218823659273e-05}, "score": 4.756382517514033}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5752854480354912, "4": 0.4219826413642915, "3": 0.0023155554153097466, "2": 0.0002896671652897346, "1": 0.00012536688996446775}, "score": 4.57201521332597}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5632905552739711, "3": 0.28626927217627696, "4": 0.13315116729417703, "1": 0.009403581985544565, "5": 0.007883392085767597}, "score": 2.566819352350938}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9807108354060518, "4": 0.019176406187458514, "3": 8.73972273054451e-05, "1": 1.2938800115090441e-05, "2": 8.788812078966382e-06}, "score": 4.980570607123232}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9977165121341695, "4": 0.0022582493268932806, "1": 1.314277999412506e-05, "3": 8.833793682483622e-06, "2": 1.4924044706392528e-06}, "score": 4.997667030624022}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9989977051333858, "2": 0.001001697718477143, "3": 4.3554008554947476e-07, "5": 2.821110901141456e-08, "4": 0}, "score": 1.001002681776839}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9996095603214171, "3": 0.0002429859342606696, "4": 0.0001386796445840641, "5": 7.461649914792043e-06, "1": 1.228379176806172e-06}, "score": 2.0005415018395207}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.960732523671801, "4": 0.039112201572260384, "3": 9.77349827555687e-05, "2": 5.539639713445029e-05, "1": 1.4710781362185926e-06}, "score": 4.9605202284161125}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5680173016917456, "4": 0.2439333614015582, "3": 0.1546441202957405, "5": 0.033401365386490335, "1": 3.49227559946933e-06}, "score": 2.742711713578256}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6716075446481867, "4": 0.2223352502405947, "3": 0.10191800107877463, "5": 0.0039169993117770625, "1": 0.00022217482189120202}, "score": 2.558117341360429}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8593341532675819, "3": 0.09941217379818792, "4": 0.04106301257559986, "5": 0.0001642563895477547, "1": 2.551750170122009e-05}, "score": 2.1820056119583677}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3580774053110799, "1": 0.26679115971263284, "5": 0.25047992534795055, "2": 0.08768705464679336, "3": 0.03696023773519642}, "score": 3.2377688846648818}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9510849969854834, "4": 0.04872669729616155, "3": 0.00018066302540151598, "2": 3.629462471968005e-06, "1": 2.9407850160300283e-06}, "score": 4.950889272456978}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8867194123775219, "5": 0.09917134175776637, "3": 0.013842689771831363, "2": 0.00026478960254123135, "1": 0}, "score": 4.0847992225778595}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6572982671705804, "3": 0.2740507693937177, "2": 0.03925938323549851, "5": 0.029310630882830754, "1": 8.015318032762884e-05}, "score": 3.6765003779271}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8512259623319459, "2": 0.14462556309394856, "3": 0.0034740785520691133, "4": 0.0005478275556549499, "5": 0.0001264089843574753}, "score": 1.1537228633185148}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9896087282153497, "4": 0.008678426895256419, "1": 0.00146395968703562, "3": 0.000186622443647839, "2": 6.134137398711093e-05}, "score": 4.984908451442221}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9320633262356847, "4": 0.06531144435103399, "3": 0.0015325451943272545, "1": 0.0008585001524925735, "2": 0.000233935762388797}, "score": 4.927487639358061}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984978159097164, "4": 0.0014954531615153795, "3": 5.3978976730728465e-06, "2": 5.114162495274366e-07, "1": 2.8970142885349305e-07}, "score": 4.9984910571860475}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9695403109993235, "1": 0.02990923450343376, "4": 0.00048735000349968703, "3": 3.221456108565274e-05, "2": 2.9550526411703304e-05}, "score": 4.879722470180885}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5142429550541909, "4": 0.46154857775708674, "2": 0.020859635566665834, "5": 0.0033343440687276073, "1": 1.4368532292598552e-05}, "score": 3.4473289465048453}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9906279202840789, "4": 0.009366322834919633, "3": 4.451279388827145e-06, "1": 0, "2": 0}, "score": 4.990624762365976}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7688080888380231, "4": 0.21271151945816918, "2": 0.018211117859577814, "5": 0.00026402995377110874, "1": 5.234600656147121e-06}, "score": 3.1950179941165}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9825397608490635, "4": 0.017446797003318592, "3": 1.2469760556754813e-05, "2": 3.3687900724734467e-07, "1": 0}, "score": 4.982527241734467}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9551871529747914, "4": 0.04479586244341786, "3": 1.604513290774283e-05, "2": 1.9621869675252292e-07, "1": 0}, "score": 4.955171425316726}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9338982245330792, "4": 0.06527446895067077, "3": 0.0007856716507131643, "2": 3.490400426327831e-05, "1": 6.489383656109713e-06}, "score": 4.933023502027162}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8393421237559354, "5": 0.15176846136508476, "3": 0.008877697909618777, "2": 1.1094644983206974e-05, "1": 3.7789895193018016e-07}, "score": 4.142867475389088}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997122460291178, "4": 0.0002870398504791354, "3": 3.0656347707348887e-07, "1": 0, "2": 0}, "score": 4.999712346905331}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994447374153582, "4": 0.0005546021212284848, "3": 3.02867627448852e-07, "1": 0, "2": 0}, "score": 4.999444791944977}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5704521425798591, "5": 0.4282605957974679, "3": 0.0011746676763827442, "2": 0.00010605921370115083, "1": 5.855846465336377e-06}, "score": 4.426856531941263}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7743137234969327, "5": 0.22078420554402495, "3": 0.004839475170404639, "2": 6.100968108939281e-05, "1": 1.4746542535829895e-06}, "score": 4.2158183111023435}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6226118550236694, "4": 0.3769322673036013, "3": 0.00039444351861777125, "2": 5.9307012755891165e-05, "1": 1.9248028712763412e-06}, "score": 4.622093148944311}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8783723380620474, "5": 0.10028605766575513, "3": 0.02038982045452032, "2": 0.0009386195743353808, "1": 1.318079120451637e-05}, "score": 4.077979454398557}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992912726659434, "1": 0.0006660247672848203, "4": 4.0921989451124397e-05, "3": 6.768765021166809e-07, "2": 0}, "score": 4.997293622201374}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6848059948713133, "5": 0.28034247450123806, "3": 0.025415374316992822, "2": 0.009309629354801499, "1": 0.00012610836259794743}, "score": 4.235929615145347}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9160225607239606, "3": 0.048198204965438696, "5": 0.03556564269369014, "2": 0.00021219667523069438, "1": 7.545977584007953e-07}, "score": 3.9869407722221184}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.813914113676706, "3": 0.1639641291134024, "5": 0.012148458374537405, "2": 0.009844221949788639, "1": 0.00012875644003268905}, "score": 3.8281095609599363}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5783240368554572, "1": 0.37076893393114296, "4": 0.03305487565382235, "3": 0.014824536490254066, "5": 0.0030264771277137862}, "score": 1.719244465204981}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8823919799406529, "4": 0.0862690998543413, "1": 0.029444215671779368, "2": 0.0009475306246496961, "3": 0.0009429962047445977}, "score": 4.791224580973235}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9606486899667407, "3": 0.030387856731284957, "4": 0.008865666136303385, "5": 7.398353422442331e-05, "1": 2.3443881827301354e-05}, "score": 2.0483177131070165}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9768778855038847, "2": 0.023029421151668648, "3": 9.138108942324162e-05, "4": 1.2425187357684758e-06, "5": 1.3756490429157732e-07}, "score": 1.0232164595715991}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7161492672043727, "1": 0.2807638652831946, "3": 0.003070508794522791, "4": 1.572398978576619e-05, "5": 5.567035304672885e-07}, "score": 1.722339739937162}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5492714034358104, "5": 0.3875310129391041, "3": 0.045258313588454585, "2": 0.01031748758122001, "1": 0.007621188121358065}, "score": 4.298774337395898}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8712240692914662, "3": 0.06571000381593492, "5": 0.04166899299610368, "2": 0.020624891652238308, "1": 0.0007694983876570584}, "score": 3.932400538749385}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.848493487200211, "3": 0.14087446560891553, "4": 0.007754667180794401, "1": 0.0027461646870516653, "5": 0.00013101352445205378}, "score": 2.1540307069399858}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5579239032525455, "3": 0.19921335358682857, "1": 0.14742091743009367, "4": 0.09433695297343689, "5": 0.0011044547551992117}, "score": 2.2437798082696285}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7176134179807123, "2": 0.15074563485195774, "4": 0.130765897033181, "1": 0.00067543542566768, "5": 0.0001993835901423167}, "score": 2.9790681536724386}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6570630622131978, "4": 0.31462434731950145, "2": 0.02801861130922657, "5": 0.0002817980157122001, "1": 1.2199543804475264e-05}, "score": 3.28714492767021}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5795034284493923, "5": 0.41315671615279514, "3": 0.006399137905213962, "2": 0.000853100668872997, "1": 8.669641712524655e-05}, "score": 4.404791660231375}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6699468487284375, "3": 0.31586107441232386, "4": 0.011378268667945557, "1": 0.0028090076709962994, "5": 4.865407910017304e-06}, "score": 2.335823178510184}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4650551073437122, "2": 0.31393645065683007, "3": 0.19827159426210397, "5": 0.016536751687466197, "1": 0.006199283240406954}, "score": 3.171793733216576}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6253038858819499, "3": 0.19951293652853255, "4": 0.10064798972719204, "1": 0.07019007919119673, "5": 0.004344313197836658}, "score": 2.3436520497512574}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.505379068801219, "3": 0.4458100564833651, "2": 0.03241829678465235, "5": 0.016379954145191337, "1": 1.1722716703934831e-05}, "score": 3.505697690541987}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9927708258011008, "4": 0.003875874361316522, "1": 0.003264983075112337, "2": 4.707313979380103e-05, "3": 3.8712384352964763e-05}, "score": 4.982845505728034}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6080818283316927, "5": 0.38626827807994574, "3": 0.005259362275405172, "2": 0.00034932197380985126, "1": 3.485046771654586e-05}, "score": 4.380208138148437}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5706928671160837, "4": 0.4283710584486707, "3": 0.0008135664097772868, "1": 7.609363017125684e-05, "2": 4.563274532141165e-05}, "score": 4.569560199521866}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8609005383366309, "1": 0.07419640352477655, "3": 0.036002838370824825, "4": 0.019802610629467206, "5": 0.009097178213269308}, "score": 2.0287032031137198}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9433093258177256, "1": 0.04804396258766619, "4": 0.008290868089979583, "3": 0.0002630827332920466, "2": 8.823383956465289e-05}, "score": 4.7987415034905965}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6077829019144608, "1": 0.23981115968567954, "4": 0.1493694816362041, "3": 0.0020542885404600327, "2": 0.000968847826695249}, "score": 3.884355898238282}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7790947735384028, "2": 0.20103219693397278, "4": 0.015034456683130725, "1": 0.004334906229543843, "3": 0.0005017482791448679}, "score": 4.363524610064956}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5844983038243843, "3": 0.28601592153757066, "4": 0.12689991171085252, "5": 0.002045898135168102, "1": 0.0005398090996906217}, "score": 2.5454137151818244}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.928323924990836, "3": 0.07012354247678905, "4": 0.0008826222074916842, "1": 0.0006636232261728539, "5": 6.1645279106864286e-06}, "score": 2.071243665981725}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9062539266205167, "1": 0.07652817540575926, "3": 0.012083342835060953, "4": 0.004894755270801267, "5": 0.00023937528677845052}, "score": 1.9460627809305167}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9865742882391964, "1": 0.007655063153034413, "3": 0.005277827100307537, "4": 0.00048791419377487266, "5": 4.7796559071686675e-06}, "score": 1.9986129311254741}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.45582733157676025, "2": 0.4306164897344645, "4": 0.10915907030373968, "1": 0.0032218820583592212, "5": 0.001174905923144919}, "score": 2.674448523991004}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5065190423740562, "4": 0.40343955670588544, "3": 0.04892586919459326, "2": 0.04103658881980315, "1": 7.70542375735916e-05}, "score": 4.375289541624517}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9000416625563298, "4": 0.09898772761663363, "3": 0.0008398119166065158, "2": 0.00011783054793893834, "1": 1.2822386106995934e-05}, "score": 4.898927852708834}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9920256581115043, "4": 0.007962619104633487, "3": 1.10075187052423e-05, "1": 0, "2": 0}, "score": 4.992015360146821}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9732660456101899, "4": 0.02666099348292435, "3": 6.642809323971937e-05, "2": 2.415128652552955e-06, "1": 2.0875613321131454e-06}, "score": 4.973190500272709}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5048676112582025, "4": 0.4654625949772762, "3": 0.029636007125316968, "1": 0, "2": 0}, "score": 4.475247661154145}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9217545090902503, "3": 0.07614081683641713, "4": 0.0019216520888226203, "1": 0.00017828075054004142, "5": 4.681228417993375e-06}, "score": 2.0798198887384123}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9663873613116991, "3": 0.02117661652825294, "1": 0.012182991978835649, "4": 0.0002514294813470476, "5": 1.5251496829003819e-06}, "score": 2.009501059678967}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7260699056635795, "2": 0.20506399045315019, "4": 0.0687274222505569, "5": 8.875604670875415e-05, "1": 4.985080067501792e-05}, "score": 2.863741232099317}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9728105041275946, "3": 0.019779182169045784, "4": 0.005559164232023005, "5": 0.0018499055412115808, "1": 1.065146190657821e-06}, "score": 2.0364461686265254}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8062120110981839, "3": 0.1241134142932933, "1": 0.056461121089742806, "4": 0.01285749460390385, "5": 0.0003557323271327155}, "score": 2.0944345007904563}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9401690306907202, "3": 0.04750721902573957, "4": 0.006687868937884041, "1": 0.005632521886010497, "5": 3.1746791050596927e-06}, "score": 2.0552599692637794}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6156907135069376, "3": 0.26159344946081786, "2": 0.09197428977099192, "5": 0.02865788372578073, "1": 0.002080572464122568}, "score": 3.576872829414338}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9354992172375347, "3": 0.042080185596466174, "1": 0.021863956935754086, "4": 0.0005543972890397373, "5": 2.054128269029475e-06}, "score": 2.0213311896512027}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8656460951976089, "4": 0.07995522407985683, "1": 0.05062574690425357, "3": 0.0024436821483430045, "2": 0.0013128451849753098}, "score": 4.708711109424715}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4932114609628313, "5": 0.47349065621176173, "3": 0.03296976993279618, "2": 0.00032626422459064365, "1": 1.0848194395301269e-06}, "score": 4.439865439362056}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9710124188691952, "2": 0.028911848071663214, "3": 7.413973014880988e-05, "4": 1.3086139949116309e-06, "5": 2.40511243012632e-07}, "score": 1.0290650167037003}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7987185804211765, "3": 0.13674997780274817, "5": 0.04471515038502511, "2": 0.01981348722886093, "1": 1.258252128067369e-06}, "score": 3.8683342198247166}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6072648238213192, "3": 0.30250332797545676, "2": 0.05531600450160105, "5": 0.034705920048359706, "1": 0.00020787554472700314}, "score": 3.6209461800921554}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9889767175915254, "2": 0.010397461387366785, "3": 0.0004463752017837134, "4": 0.0001472651285695539, "5": 3.2101557781086133e-05}, "score": 1.0118604143463172}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4638306369315726, "4": 0.4591741633690066, "5": 0.03841953979423139, "2": 0.03804298021997585, "1": 0.0005319257212931789}, "score": 3.496906785944695}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5920275133054168, "1": 0.3072792917033585, "3": 0.09079210014211495, "4": 0.009798532984208769, "5": 0.00010121273187324914}, "score": 1.8034132473811129}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.958713091041228, "3": 0.03311491148521992, "4": 0.007825885390586809, "1": 0.0002950841464779999, "5": 5.091790133853569e-05}, "score": 2.0486243571743192}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9852174832539912, "4": 0.014607838657423098, "3": 0.0001731292729547802, "2": 6.706596880104819e-07, "1": 0}, "score": 4.985043877683796}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9728132124358081, "5": 0.02117474459809238, "4": 0.003845029514427594, "2": 0.0015288400016337362, "3": 0.0006359383075732577}, "score": 1.0990350049097775}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9636434162086895, "4": 0.03621637189852602, "3": 0.00013812396209014256, "2": 5.750407092267216e-07, "1": 4.914390073367952e-07}, "score": 4.963503652019907}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8387799025544962, "3": 0.12266619188396026, "5": 0.028532262911218263, "2": 0.009221781857992542, "1": 0.0007997363876787805}, "score": 3.885023283844598}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4535209111072158, "1": 0.41406962622911336, "5": 0.10156275456246783, "3": 0.01784069313011669, "2": 0.01300350425198225}, "score": 2.8155032003023024}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8179066734706097, "4": 0.17275490899150775, "1": 0.007771269835214037, "3": 0.001149638538916068, "2": 0.0004168753090272116}, "score": 4.792609977207578}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9794954909776704, "4": 0.011442829382097564, "2": 0.003580497219804698, "3": 0.0034417541852435835, "5": 0.002039136999690115}, "score": 1.0529490571559896}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5904355760346628, "1": 0.29246078198012665, "3": 0.08360878338470608, "4": 0.03331384175645128, "5": 0.0001808879100543681}, "score": 1.8583183303800608}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5218772614860308, "3": 0.3795134163767262, "2": 0.09463896457895232, "1": 0.0025207588294236735, "5": 0.0014493568103919124}, "score": 3.425095595707493}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9951851865554847, "2": 0.004796817028938826, "3": 1.492037991561171e-05, "4": 2.4052348703156256e-06, "5": 5.266645597901286e-07}, "score": 1.00483598084866}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5566650869821996, "5": 0.44097019096656737, "3": 0.002339802628417615, "2": 2.1069627699511334e-05, "1": 3.356687276334023e-06}, "score": 4.438578395287366}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5273022317733473, "4": 0.32947921745597597, "5": 0.07205934956503292, "2": 0.04343536534505996, "3": 0.027706791924890773}, "score": 2.375547444565089}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7812539358939189, "1": 0.11816043019286808, "3": 0.08011056788218476, "4": 0.020194366492115375, "5": 0.0002797246028664448}, "score": 2.0031780475805396}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8194611982477913, "5": 0.1273082586540909, "2": 0.03044949407216179, "3": 0.022776795556943705, "1": 4.0787295615935435e-06}, "score": 4.0436202463863165}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8987802254229957, "3": 0.07829046958970688, "5": 0.020157265194815824, "2": 0.0027656474839809642, "1": 6.080449097461499e-06}, "score": 3.936317239429787}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6130710159004221, "5": 0.20967547514750107, "1": 0.11355953978510627, "2": 0.038548137269406285, "3": 0.02513394389567597}, "score": 3.766763864646076}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5839675866534244, "2": 0.21095032495011726, "5": 0.15922819770395075, "3": 0.029029152363825878, "1": 0.01682233182465619}, "score": 3.6578305765338275}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9998620238095902, "4": 7.012052575550715e-05, "5": 5.270459049729242e-05, "1": 1.0643523211089955e-05, "3": 4.501067351908217e-06}, "score": 2.000292212369038}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4755575375527924, "3": 0.3873666184090799, "2": 0.13058476798379087, "5": 0.005720000420937277, "1": 0.0007709087069784941}, "score": 3.354871012234267}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6650616472442322, "4": 0.331771068708123, "3": 0.0030214059789173547, "2": 0.00013511557968429885, "1": 1.0140380863537085e-05}, "score": 4.661740000637224}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9999725091278809, "4": 2.7206680723123157e-05, "3": 9.003656242016769e-08, "1": 0, "2": 0}, "score": 4.9999726132408355}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8929506033795811, "5": 0.1070426848754132, "3": 5.559529920214886e-06, "1": 0, "2": 0}, "score": 4.107037248675426}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8218607189084836, "5": 0.17347156214060763, "2": 0.0027399423471216647, "3": 0.0019273119864156604, "1": 0}, "score": 4.166064442616372}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.9712510910060096, "2": 0.016184083819041614, "4": 0.01215901997321486, "5": 0.0003895834759323471, "1": 1.5877699188762457e-05}, "score": 2.9967223465800603}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.956878188858413, "3": 0.027208512366215465, "4": 0.0151418476616624, "5": 0.0007701914790037213, "1": 1.082647638245029e-06}, "score": 2.059801710063043}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6392180285898649, "2": 0.25661170810413386, "4": 0.10039631254885789, "5": 0.0037632813601346073, "1": 9.975624406545978e-06}, "score": 2.8512911127460288}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9592545419204836, "4": 0.0385307174485366, "3": 0.001665445539590937, "2": 0.0005392080871796898, "1": 0}, "score": 4.9565203286311155}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9986463952504614, "3": 0.0010997586855688534, "4": 0.00024192761212605087, "5": 8.731023112171541e-06, "1": 3.0913891653674223e-06}, "score": 2.0016067157443005}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6335194989365471, "2": 0.17247527260557058, "3": 0.17048831812529783, "1": 0.01275583710480676, "5": 0.01075935145245989}, "score": 3.457052041967207}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9879718599222065, "2": 0.012020160466569509, "3": 7.7248666304204e-06, "4": 1.1365241925327794e-07, "5": 2.1051332019161865e-08}, "score": 1.0120360368072323}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7962033427857729, "2": 0.14641620407609754, "3": 0.030872091219078572, "4": 0.026505911377964025, "1": 1.8780566735957845e-06}, "score": 4.472493479739631}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9740880042322746, "5": 0.02518928936530184, "1": 0.0004489170190985941, "4": 0.00018348016297348586, "3": 8.98966392849723e-05}, "score": 2.0755758392231995}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8941750568018686, "2": 0.10356042709255245, "4": 0.00221202100375209, "5": 5.144774117253942e-05, "1": 8.727724220744654e-07}, "score": 2.898752726172119}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9862985748194149, "2": 0.01367931282691578, "3": 2.014321602411704e-05, "4": 1.6824121344512061e-06, "5": 1.9456471583523597e-07}, "score": 1.0137254260191766}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8073794362386805, "4": 0.1914269892956725, "2": 0.000946634021881225, "3": 0.000244684972826512, "1": 0}, "score": 4.805243299424951}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8994799913771394, "4": 0.09768377532482803, "2": 0.0024325005932968303, "3": 0.00039902172257998494, "1": 3.894123251000051e-06}, "score": 4.894205016537542}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5877234704817959, "5": 0.14686909487475672, "4": 0.1395952381372968, "1": 0.12285025553010222, "3": 0.0029589331438193574}, "score": 2.5999082429359284}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7713115048291392, "5": 0.2213649460131828, "3": 0.007216525316656914, "2": 0.00010667177087823798, "1": 1.8620139131085932e-07}, "score": 4.213934554035652}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.979111812542766, "4": 0.020747239029039757, "3": 0.00013516341906657814, "2": 2.671533248489943e-06, "1": 2.6470850619687265e-06}, "score": 4.978963821381753}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5041879468539882, "2": 0.482249738232986, "3": 0.013433509293656977, "4": 0.00012782249682730636, "5": 5.884237413710931e-07}, "score": 1.5095027791058833}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7627004803577211, "4": 0.23573836778519922, "3": 0.001077533118534278, "1": 0.00026287892316037266, "2": 0.0001930205303203381}, "score": 4.760469349075735}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6145859007987472, "4": 0.37728873852214645, "3": 0.00686474078086164, "2": 0.0011867829927409616, "1": 7.304425993955126e-05}, "score": 4.605128940905355}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6940494620844035, "2": 0.300995098024128, "3": 0.004892425921721427, "4": 6.231103631165904e-05, "5": 4.519410888550169e-07}, "score": 1.3109687687916423}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.52789778660048, "3": 0.394750247052938, "2": 0.054258517189489736, "5": 0.022440928997701618, "1": 0.0006519204582688306}, "score": 3.5172175966658292}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9826467996479415, "4": 0.017305342675182828, "3": 4.6288037480820315e-05, "2": 1.5197542603388123e-07, "1": 0}, "score": 4.982601600658493}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9617214117807591, "4": 0.038078079638188905, "3": 0.00019720120603860774, "2": 2.571464440853262e-06, "1": 0}, "score": 4.961519775238408}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8883912110683952, "4": 0.10389233047619792, "1": 0.007105394462311647, "3": 0.000527215750217161, "2": 8.140954755528186e-05}, "score": 4.866387105690315}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7831170304372711, "4": 0.21648253598272893, "3": 0.0003924513411575666, "2": 7.202841190417639e-06, "1": 0}, "score": 4.782710783456681}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9940509315046032, "4": 0.0059410790729105085, "3": 5.522344829053974e-06, "1": 1.256505629085823e-06, "2": 0}, "score": 4.9940428430033466}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7924818703677053, "1": 0.20548309730209657, "4": 0.0019364032916867084, "3": 6.30492115995677e-05, "2": 3.0871442263118485e-05}, "score": 4.17590861461071}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.6380251349117272, "5": 0.35980656909612774, "4": 0.0016434026499307117, "3": 0.0003674250153479031, "2": 0.0001541255543084408}, "score": 2.445050290393763}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9996792476720305, "5": 0.0003077022387214268, "3": 1.1500569523945345e-05, "1": 0, "2": 0}, "score": 4.000296202128169}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8676075481783575, "5": 0.12980603255781636, "3": 0.0024892311283107537, "2": 7.974607769632833e-05, "1": 0}, "score": 4.127159527197938}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6455848944449629, "3": 0.166608921543818, "5": 0.11952147698919473, "2": 0.0682828528700942, "1": 1.5892267194536986e-06}, "score": 3.8163420333694047}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5583071611734555, "3": 0.34780127888449897, "2": 0.07210008902129289, "5": 0.02146258054373136, "1": 0.00032787307202763}, "score": 3.5284770247178865}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6679109651716489, "3": 0.30861377591924916, "2": 0.01869506301259565, "5": 0.004767272216626377, "1": 1.249492495122397e-05}, "score": 3.65872573917431}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7459451551848223, "3": 0.22423665259843037, "2": 0.02105792300256549, "5": 0.008733891034586251, "1": 2.593031008352132e-05}, "score": 3.7423034860863624}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9490208102533931, "3": 0.05012674905995473, "4": 0.0008510084499536069, "1": 6.621604094595232e-07, "5": 4.3254736591694807e-07}, "score": 2.0518294189354784}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8142112465516488, "4": 0.136329953891034, "5": 0.04606512144690458, "2": 0.003385754507888037, "1": 7.266200719957159e-06}, "score": 3.225060057830403}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6161946531446166, "5": 0.312096014416505, "3": 0.061998331846538635, "2": 0.00968599743322099, "1": 2.349972121678642e-05}, "score": 4.2306555353161475}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.961374885216561, "4": 0.03834776622238434, "3": 0.00026880590004069806, "2": 5.829321180341384e-06, "1": 0}, "score": 4.96109702845701}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6922429715737104, "3": 0.1456049276561501, "5": 0.09650844128566642, "2": 0.06560875051047718, "1": 3.408002917260014e-05}, "score": 3.819583622965823}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.39805420082196374, "5": 0.28802039078951674, "1": 0.202072547503805, "2": 0.08033123940477734, "3": 0.031517204740994315}, "score": 3.4896208105159108}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8015885762004743, "4": 0.19784703447839166, "3": 0.0005425787075672058, "2": 2.095293135299922e-05, "1": 5.587459161215859e-07}, "score": 4.80100265484122}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.47588803643130645, "5": 0.46496164531046885, "3": 0.035963368508619274, "2": 0.01806465883454204, "1": 0.005120936226032434}, "score": 4.377506661858803}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9762240797626784, "4": 0.023732596406554774, "3": 4.232765089543718e-05, "1": 0, "2": 0}, "score": 4.976182724565364}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8979773353766048, "5": 0.09615526983239792, "3": 0.0054463163386298105, "2": 0.00041802404632534966, "1": 2.745300547294743e-06}, "score": 4.089864697277147}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9306287276667238, "4": 0.050688561767581436, "3": 0.018680245572283472, "1": 0, "2": 0}, "score": 4.911950730046981}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"1": 0.809884236038871, "2": 0.1779816186559783, "3": 0.009970535353606431, "4": 0.002135421986661531, "5": 2.6967017844201988e-05}, "score": 1.2044370730013914}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6846569836052133, "3": 0.16909608082783992, "1": 0.07798321248562035, "4": 0.06769357551147637, "5": 0.000569389969037077}, "score": 2.2282083621631243}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3714413874314549, "2": 0.30782769018776324, "4": 0.248727912712837, "1": 0.065660923639721, "5": 0.00634032468309276}, "score": 2.822258711548064}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9516552329934143, "4": 0.046855288271886314, "2": 0.0014171812717874224, "3": 6.30079908958209e-05, "1": 4.522403308522709e-06}, "score": 4.948748817999819}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9815485179863501, "4": 0.010590512773529808, "3": 0.007768548036141702, "5": 8.230299991282033e-05, "1": 9.766357367182461e-06}, "score": 2.0291867264948262}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9275393310081572, "5": 0.031066879348511656, "4": 0.028609999196634588, "3": 0.012741409489361288, "1": 4.2073288334929875e-05}, "score": 2.1631200228268046}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7899235660794434, "5": 0.08694725574321853, "2": 0.06290205153429969, "3": 0.06006633765096005, "1": 0.0001597181274168424}, "score": 3.9005975541948423}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997718141583503, "4": 0.00022516772252791038, "3": 2.6238627339699376e-06, "1": 0, "2": 0}, "score": 4.999769584461161}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6962932995607599, "4": 0.3011457235475023, "3": 0.002179511521490413, "2": 0.0003808720751419991, "1": 2.6531156091234727e-07}, "score": 4.693351475362177}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9998652418606938, "4": 8.132882932696758e-05, "5": 4.0265964467691355e-05, "3": 1.3028321411893817e-05, "1": 5.3611780905904324e-08}, "score": 2.0002964302858213}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"2": 0.41820455505402265, "3": 0.4029112518587236, "4": 0.17657033206976042, "1": 0.001556357692726397, "5": 0.0007566990043830713}, "score": 2.7567662640011994}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5370012267635486, "4": 0.4498020868325643, "2": 0.008522901879032782, "3": 0.004665107971194875, "1": 5.857755782485859e-06}, "score": 4.515274194220746}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8606339845409112, "4": 0.13924186806178726, "3": 0.00012245609504730643, "2": 7.433067679372427e-07, "1": 0}, "score": 4.860510857592736}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8991373547768419, "4": 0.09591237161912848, "1": 0.004020903300403172, "3": 0.0008607217297723205, "2": 6.553743839907969e-05}, "score": 4.886085605001404}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9026864836834481, "5": 0.05616890314754044, "3": 0.040516256108830216, "2": 0.0006207243223234013, "1": 6.153343286712964e-06}, "score": 4.014392759656775}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9747028243327986, "2": 0.02520879594324644, "3": 8.187466136642557e-05, "4": 4.2540376105724775e-06, "5": 2.1252693726961608e-06}, "score": 1.0253938116497159}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9912954201483583, "2": 0.00869694903898641, "3": 7.024858396707037e-06, "4": 2.647756429318517e-07, "5": 2.065903479273692e-07}, "score": 1.0087126206167167}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5615616026262336, "1": 0.2076845161475671, "3": 0.14214434835417394, "4": 0.07836013210768962, "5": 0.010248325014198976}, "score": 2.1219252026256363}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.747885505677291, "1": 0.14255035118995626, "4": 0.07129336595501108, "2": 0.033286029651767926, "3": 0.00497939291497521}, "score": 4.248684331496768}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9358089599068032, "1": 0.046970750536960044, "3": 0.01688077801399495, "4": 0.00032226898628701274, "5": 1.7126441537267728e-05}, "score": 1.9706059413611465}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6623487295158023, "3": 0.19813523031982674, "4": 0.11822082560240955, "1": 0.01897522686077205, "5": 0.0023196081695574153}, "score": 2.422560639547675}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.647694418659246, "2": 0.351845894134863, "3": 0.00045293976971842595, "4": 6.180829946261124e-06, "5": 5.511504588530063e-07}, "score": 1.352772526218344}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9992377107302015, "4": 0.0004578312003372373, "1": 0.00029604709842416906, "3": 6.822654083562756e-06, "2": 1.1376452522361347e-06}, "score": 4.998340921414343}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.4602439840512519, "4": 0.279064762623175, "5": 0.2247915389036275, "2": 0.02382236103761495, "3": 0.012074336852490649}, "score": 2.784336860735585}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997958844344171, "4": 0.00018187371233656374, "1": 1.9704234422760012e-05, "3": 1.307108646697575e-06, "2": 0}, "score": 4.999736694808679}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8657355124006539, "3": 0.13192931397718924, "4": 0.0018445074535059134, "1": 0.000489125233524813, "5": 1.593864480049621e-06}, "score": 2.135133978091562}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8885827022189846, "3": 0.09774554075811953, "4": 0.012598330169969169, "1": 0.0009647135886551609, "5": 0.00010866639122588583}, "score": 2.122303492415818}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8576370908576774, "2": 0.0607046364987105, "5": 0.05727046117290558, "3": 0.024373090588434884, "1": 1.4409108739563891e-05}, "score": 3.9114448426516772}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5570941627119168, "1": 0.41911863948930445, "4": 0.023323715580066996, "3": 0.00025309275901716114, "2": 0.0002064465534765313}, "score": 3.2990694946747854}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.916765261292423, "5": 0.05976173534549218, "2": 0.01761889100521498, "3": 0.005849668418166968, "1": 0}, "score": 4.018674367904642}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5877780901617718, "2": 0.3594249089481274, "3": 0.04240092928013849, "4": 0.010234949437882918, "5": 0.00015922472322051296}, "score": 1.475569417083583}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8261713677250312, "5": 0.10465415783652697, "3": 0.06695144659389787, "2": 0.0021894804516243834, "1": 2.9477774068200098e-05}, "score": 4.033235452272799}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.6499036875962456, "3": 0.3331155007636035, "1": 0.011114530196284843, "4": 0.005740178336825129, "5": 0.00012592286764598188}, "score": 2.333859156018479}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7316953501287029, "2": 0.250399258756048, "3": 0.014413174425468758, "4": 0.0034326023597819662, "5": 5.698673708066028e-05}, "score": 1.2897521229852804}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5352457991134679, "2": 0.2778662489364453, "4": 0.1845671915420356, "5": 0.001285586300129269, "1": 0.0010335731525224678}, "score": 2.9072048203398593}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8274820035030326, "2": 0.17230941394489924, "3": 0.00020642611627939497, "4": 1.6793546084415981e-06, "5": 4.454739791207831e-07}, "score": 1.1727290915966826}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9989759313165953, "4": 0.0010217340971162053, "3": 1.847788572703842e-06, "2": 1.79936108831915e-07, "1": 0}, "score": 4.998974030202582}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9860048130519358, "4": 0.011458787225967394, "3": 0.0021394718060845563, "2": 0.000396347978097415, "1": 0}, "score": 4.983073215411087}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9867720456613764, "1": 0.012987050933220164, "5": 9.183473086725344e-05, "4": 8.099565878297715e-05, "3": 6.794241838309216e-05}, "score": 1.9875183853652647}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970050393694736, "4": 0.00297113721138081, "3": 1.1416315974020376e-05, "2": 1.0295424342748264e-05, "1": 1.0572820992250816e-06}, "score": 4.996970911561385}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3027435504488893, "4": 0.2908043135622545, "1": 0.17932447582834657, "3": 0.1195322224529774, "5": 0.10759361211260145}, "score": 2.844598751982145}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7322692315351423, "4": 0.26354127023029145, "2": 0.002722486940626686, "3": 0.0014588526622151198, "1": 8.016946053014546e-06}, "score": 4.7253414569240055}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9856311929623582, "4": 0.01410636168524371, "3": 9.74259456836856e-05, "2": 8.383105788381014e-05, "1": 8.067224257774225e-05}, "score": 4.985124596602137}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993877088267916, "4": 0.0005635897301404119, "1": 4.281474522950616e-05, "3": 3.823600652905769e-06, "2": 1.4590223059805802e-06}, "score": 4.99925312656955}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990908572209484, "4": 0.0009056113658180295, "3": 2.0744800790320492e-06, "1": 5.30319066114342e-07, "2": 3.9301855989356266e-07}, "score": 4.999086938854874}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9751772652470722, "4": 0.024717306813545087, "3": 8.527314355442724e-05, "2": 1.8650809649032547e-05, "1": 1.3549052937320361e-06}, "score": 4.97505077112977}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.9472005871243713, "2": 0.05126337599461582, "4": 0.0015270721566473808, "5": 8.6975689707554e-06, "1": 0}, "score": 2.950281078017295}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9928467392368441, "4": 0.004616045005186972, "2": 0.001874464988019164, "3": 0.0003592598195162942, "1": 0.00030207718311929017}, "score": 4.987833714458948}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8632094219124049, "4": 0.1367836908272361, "3": 6.279312864195323e-06, "1": 0, "2": 0}, "score": 4.863203667382048}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.799901039172651, "4": 0.20008760166634962, "3": 3.91693146594959e-06, "1": 0, "2": 0}, "score": 4.799903075303476}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5928949178423619, "2": 0.258393877820368, "4": 0.14481401717803313, "5": 0.003161626716931433, "1": 0.0007353298381691641}, "score": 2.8912727080422265}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9601012483982561, "3": 0.037142403892151205, "4": 0.002177121472869478, "1": 0.0005523682580354675, "5": 2.676289887256965e-05}, "score": 2.0410245711770805}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9723871814605503, "4": 0.02759402541950228, "3": 1.7862357363296303e-05, "2": 3.368217426837382e-07, "1": 0}, "score": 4.972369222989496}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8139530603988382, "5": 0.12416362832447804, "3": 0.061819588421006356, "2": 6.314815031103457e-05, "1": 0}, "score": 4.062217779359741}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9033758847469301, "3": 0.04097549802760979, "1": 0.04060965633055461, "4": 0.014154651231017452, "5": 0.0008840601983183307}, "score": 2.031327332569136}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6634358328397587, "3": 0.28570070560713484, "4": 0.046250995080550805, "1": 0.004324356222355634, "5": 0.00028794444377374496}, "score": 2.374742235011873}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6036980942306271, "4": 0.2917873486705737, "3": 0.09502481604192907, "5": 0.007116238455309745, "1": 0.0023722571336283866}, "score": 2.6975768404249623}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9481446566168582, "1": 0.034506667939881816, "3": 0.017278782072598548, "4": 6.857551576415675e-05, "5": 1.272000118354954e-06}, "score": 1.9829130803810835}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8145501103470624, "3": 0.1622030878795861, "5": 0.02323889721840879, "1": 0, "2": 0}, "score": 3.8610347108800602}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6026002725475668, "1": 0.39409893387470474, "3": 0.003224179434578034, "4": 7.507409490837896e-05, "5": 1.4829866453611064e-06}, "score": 1.609279820414509}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9991227496093068, "3": 0.0008120935622456227, "1": 4.7684650705478405e-05, "4": 1.7131169087503956e-05, "5": 3.31577920713133e-07}, "score": 2.000799665991019}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7534052088178157, "3": 0.22750963268840796, "4": 0.010227252580956544, "1": 0.008810626757183155, "5": 4.6928096002077106e-05}, "score": 2.239294379387742}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.49549667778873013, "3": 0.28376041670662483, "2": 0.17711676050868824, "5": 0.04362502174530311, "1": 3.8821093427729234e-07}, "score": 3.40562948250256}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8422268946161936, "3": 0.1546198739986375, "2": 0.002721576421037937, "5": 0.00043043854366557724, "1": 0}, "score": 3.840367217522368}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.7941478706492324, "4": 0.13525041403544633, "5": 0.06909575381167751, "2": 0.0015051786251753312, "1": 0}, "score": 3.2719369559272136}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8178496755406515, "1": 0.18090455630986124, "3": 0.0012379010935941591, "4": 7.649035473272397e-06, "5": 2.731447397565456e-07}, "score": 1.8203494721920122}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9463459444231237, "4": 0.05343461617805548, "3": 0.00018866983033683407, "2": 1.5244801473646888e-05, "1": 1.4912765005535955e-05}, "score": 4.946082625699288}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6882430727706825, "5": 0.28651740334859266, "3": 0.024660968694550492, "2": 0.0005611698137156967, "1": 1.554754204000503e-05}, "score": 4.260687931500701}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5173600113011083, "4": 0.3917906531237032, "1": 0.07739929553831754, "3": 0.008003366606597232, "2": 0.005442966795243476}, "score": 4.266273811468909}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9576786899320272, "4": 0.042087339836110724, "3": 0.00018902202789254787, "2": 2.6064716928969807e-05, "1": 1.7311024588037024e-05}, "score": 4.957387110851798}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5046309545137638, "2": 0.489629664677706, "3": 0.00559066296755706, "4": 0.0001462109669681392, "5": 2.370622450401882e-06}, "score": 1.5012591743008679}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9996972344427446, "3": 0.00019934531216781248, "1": 7.779977646379948e-05, "4": 2.531792284983289e-05, "5": 2.2051811306803403e-07}, "score": 2.00017284294992}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8962079731953578, "3": 0.07089665682080719, "4": 0.03176057303824723, "1": 0.001029186700307273, "5": 0.00010561131952132737}, "score": 2.1337054500119272}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.99714476346348, "5": 0.0028011489687156128, "4": 4.610168765792376e-05, "2": 4.988965421786757e-06, "3": 2.1806643061315866e-06}, "score": 1.0113522604981575}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9983455912454489, "2": 0.001240430229831751, "4": 0.00032327344950646006, "5": 9.003284587922393e-05, "1": 0}, "score": 2.999262908415939}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9289958475356298, "1": 0.04616956796454917, "3": 0.023941036118145142, "4": 0.0008586767641378258, "5": 3.47297808963551e-05}, "score": 1.9795930081301014}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9089898563480319, "1": 0.08178053680941434, "3": 0.008833426389969775, "4": 0.0003914771537184646, "5": 4.487660673998956e-06}, "score": 1.9278492913115663}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9959665612532814, "4": 0.002186018776132586, "3": 0.0018045265874849098, "2": 1.4589697821230006e-06, "1": 0}, "score": 4.994200310832833}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9399858331017592, "5": 0.05996557688397161, "3": 4.559046336721228e-05, "1": 0, "2": 0}, "score": 4.059920166154193}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5529661449716267, "4": 0.43154508049461326, "3": 0.008687992317991756, "1": 0.005554971424545466, "2": 0.0012412041274809918}, "score": 4.525133249237336}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8990612190492715, "1": 0.09663154869861042, "3": 0.004154475882612706, "4": 0.00015024564049172774, "5": 2.459208519082143e-06}, "score": 1.9078307913419397}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.630131318029982, "3": 0.310619558559679, "4": 0.0591558258850772, "1": 7.27251711645258e-05, "5": 2.053068421334466e-05}, "score": 2.428920095084359}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.361764619868387, "2": 0.24936547189694522, "1": 0.1709317884523325, "3": 0.12580565291425233, "5": 0.09213132261499486}, "score": 2.9547981645744263}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4713993346099917, "2": 0.3663748827420959, "4": 0.1578315585112849, "5": 0.004391541388357124, "1": 1.9051229705483813e-06}, "score": 2.8002357929582606}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6205786250223638, "4": 0.28470366829719435, "5": 0.04897814993583952, "3": 0.04572925649624989, "1": 9.886889217272877e-06}, "score": 2.76206147101401}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4123779894959309, "2": 0.3465715805546279, "4": 0.2239982812830635, "5": 0.012110311490367487, "1": 0.004941882240539508}, "score": 2.891763564105715}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9738933823865757, "2": 0.02609255380983722, "3": 1.3561739526696345e-05, "4": 2.5928033138938153e-07, "5": 1.549887970090912e-07}, "score": 1.0261210773783709}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7634241533435351, "3": 0.19379410460170718, "4": 0.024827558821053978, "1": 0.017433523298068656, "5": 0.0005205378260621567}, "score": 2.2275773402133043}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9494888289416571, "2": 0.049342307581204836, "5": 0.0005904446268804308, "4": 0.0003006141527751654, "3": 0.000276710700520024}, "score": 1.0531594081043232}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9133095488612553, "3": 0.05808978779632196, "1": 0.026641343577257278, "4": 0.0018760426389593998, "5": 8.313672635543329e-05}, "score": 2.0354499446532164}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5099584638560352, "3": 0.4896427673428457, "1": 0.00034291375004974896, "4": 5.520058538150749e-05, "5": 5.384177990530015e-07}, "score": 2.4894119268121764}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9834246089137322, "1": 0.009632186770294524, "3": 0.006798219087490754, "4": 0.000142972536299317, "5": 1.9415964712112604e-06}, "score": 1.997457801998469}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9438062165383535, "3": 0.05565858196180911, "1": 0.0003829956218691534, "4": 0.0001518294054455393, "5": 3.0378822700132574e-07}, "score": 2.0555801605553166}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.46203056596106273, "2": 0.39846090139781326, "4": 0.1367680846984593, "1": 0.0018359682132102946, "5": 0.0009040688852295863}, "score": 2.7364432763639264}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4759342474031503, "4": 0.36422863150236945, "2": 0.15143799677720646, "5": 0.0082169843879867, "1": 0.00018188280624952647}, "score": 3.228860896734046}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9715909329293703, "2": 0.028394545844141562, "3": 1.4178632218650243e-05, "4": 1.643305317321858e-07, "5": 7.727309511190787e-08}, "score": 1.028423708063083}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9971339764097762, "3": 0.002790453085771079, "4": 6.489188374064314e-05, "1": 1.0550197266189443e-05, "5": 1.725717059814249e-07}, "score": 2.002910204242624}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.913607244950172, "1": 0.08163723580134254, "3": 0.004688977675136556, "4": 6.434946100164693e-05, "5": 2.205785227970899e-06}, "score": 1.9231870592017357}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8527310330754388, "4": 0.1003362332996794, "1": 0.04660126930112146, "3": 0.00024253561315457228, "2": 7.890397114580523e-05}, "score": 4.7125340245845795}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7733539684541513, "4": 0.19100094563102274, "3": 0.01921691112219253, "5": 0.016325266162025388, "1": 0.00010262900144642937}, "score": 2.450092097727744}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7151205994156515, "5": 0.1677536071888983, "3": 0.11271921224682649, "2": 0.004405531801910354, "1": 6.822586491822941e-07}, "score": 4.0462213015295925}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7654309273699769, "5": 0.12496888408342338, "3": 0.0929820700107195, "2": 0.016615820422027142, "1": 1.919728093350462e-06}, "score": 3.998749413571166}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982177680648591, "4": 0.001770365423057908, "3": 1.0337422444380456e-05, "2": 9.986324938541242e-07, "1": 0}, "score": 4.998205962882912}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9507384353125455, "4": 0.02743488500564833, "5": 0.015087540624030867, "3": 0.006733912177382755, "1": 4.578724921583622e-06}, "score": 2.106861794598907}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5881722687073017, "4": 0.4029942843058208, "3": 0.007845127033522081, "2": 0.0009865640579925332, "1": 5.307174853206807e-07}, "score": 4.578353129990799}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9949078027197173, "4": 0.005069870520845126, "3": 1.9080245979879654e-05, "2": 3.0376420043107593e-06, "1": 1.0481709061163546e-07}, "score": 4.9948824362603155}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4819318331177082, "4": 0.3493262429060195, "1": 0.09698664406601314, "3": 0.04125089374049163, "2": 0.030500914872468424}, "score": 4.088719485405951}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6094543684803001, "4": 0.3768586746941679, "3": 0.013608204446611538, "2": 7.470705693047912e-05, "1": 2.3269340855034277e-06}, "score": 4.595690792745423}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9748211896831642, "1": 0.02444871061584709, "4": 0.00072153137132188, "3": 5.917538437590913e-06, "2": 1.5519598599065293e-06}, "score": 4.901467026937712}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9897897194604047, "4": 0.009757396170111914, "1": 0.0003545443904302455, "3": 8.080772423811115e-05, "2": 1.6833476591519257e-05}, "score": 4.988612302432441}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9064859391946756, "3": 0.0530738786110205, "1": 0.025609886772568015, "4": 0.012968265776031817, "5": 0.0018618560731997942}, "score": 2.0589861018484807}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7338602819892893, "1": 0.2635633559141139, "3": 0.002518579315811756, "4": 5.407319317490424e-05, "5": 3.7394837156897354e-06}, "score": 1.739074596039848}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6772469036315458, "5": 0.22809884802760727, "3": 0.08549823897800654, "2": 0.00905797494423088, "1": 9.57591857288479e-05}, "score": 4.124197664182562}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5845683484527716, "5": 0.3479303718908188, "3": 0.032109742186014756, "2": 0.029824147345208375, "1": 0.005550051899534719}, "score": 4.239526332277382}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9294208265364153, "4": 0.07036485916695813, "3": 0.00021316692792676815, "2": 2.5741893035137803e-07, "1": 0}, "score": 4.929207971719048}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6213293396669615, "5": 0.36780613010450736, "3": 0.007718339721935788, "2": 0.002165074298722303, "1": 0.0009786041875452728}, "score": 4.352822715520325}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7946425087420672, "3": 0.08186244829876925, "2": 0.07743089638004927, "5": 0.027789889819196896, "1": 0.018273574118532646}, "score": 3.736244746354479}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984897331026119, "4": 0.0014754360584996863, "3": 3.278806436859559e-05, "2": 1.901118805676932e-06, "1": 0}, "score": 4.998453284237245}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8410988392943621, "3": 0.13650213820149398, "2": 0.01127436178082935, "5": 0.011111899698319095, "1": 1.1250758605356584e-05}, "score": 3.852027062180796}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6942626235203522, "5": 0.29446085645136927, "3": 0.009644702288757575, "2": 0.0014277778419951221, "1": 0.0002024875813428934}, "score": 4.281353572484296}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8129863168652551, "4": 0.18655846570329015, "3": 0.0004346022556415428, "2": 1.2883102357837028e-05, "1": 5.731776731474939e-06}, "score": 4.812510378336553}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5614088505712795, "4": 0.3499910836881114, "2": 0.08644927960242939, "5": 0.0019283289116789532, "1": 0.00022243536342997735}, "score": 3.2669535970186048}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6903294856018586, "4": 0.30153659310916786, "3": 0.007021755647330076, "2": 0.0010657787781099622, "1": 4.511359119413782e-05}, "score": 4.6810416987762835}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6442987261154866, "1": 0.31786026850073495, "4": 0.03532693411123407, "2": 0.001790021406969761, "3": 0.0007160060079838045}, "score": 3.6864193493932618}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9555371460729065, "4": 0.043691705516949134, "1": 0.00043517252339370235, "3": 0.0002567770138717305, "2": 7.614021372603547e-05}, "score": 4.953825488488463}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9208243329904718, "2": 0.07077028286078504, "3": 0.004510938743543481, "4": 0.0028527951812123502, "5": 0.0010394401791888619}, "score": 1.0925085110562183}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4070956943187109, "3": 0.3834294647974317, "2": 0.17384513583688782, "5": 0.034944478696232045, "1": 0.0006840366909777882}, "score": 3.3017718014981}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4995636158219976, "4": 0.29069731726339, "5": 0.2068102650514958, "2": 0.002924935060743463, "1": 2.106318333852303e-06}, "score": 3.701389934454755}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7394477907998226, "2": 0.1708873519643287, "4": 0.08895653494025389, "3": 0.0007052955663219099, "1": 0}, "score": 4.396968992822514}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9248230657836508, "4": 0.07459303803910146, "3": 0.0005824728401286766, "1": 0, "2": 0}, "score": 4.924241908451338}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8918665100602394, "5": 0.0836940994824287, "3": 0.02426021289374493, "2": 0.0001778532119234937, "1": 1.2045855404740822e-06}, "score": 4.059074573483349}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9953142475528624, "4": 0.00334113202425321, "5": 0.00114824682481569, "3": 0.00019615958908768497, "1": 8.104194311985979e-08}, "score": 2.010323084442728}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6210732432261769, "4": 0.37861023756075013, "3": 0.0003157019454757778, "2": 4.194325963965763e-07, "1": 0}, "score": 4.620756949374349}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964705603663118, "4": 0.003528358254263437, "3": 8.816250365152045e-07, "1": 0, "2": 0}, "score": 4.996469877790505}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9963524276132634, "4": 0.003646413125141439, "3": 6.158206921242527e-07, "1": 0, "2": 0}, "score": 4.9963523532511935}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8633600132981621, "2": 0.08270935199270851, "4": 0.02316483228863692, "3": 0.022910636506300184, "5": 0.007855055042334457}, "score": 1.2294453674795915}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7461442745180341, "4": 0.23241525849150316, "2": 0.01956870641828107, "3": 0.0014407326644924267, "1": 0.000429947564386312}, "score": 4.704277047184812}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983811198025054, "4": 0.0016025759108919452, "2": 1.3962896450834833e-05, "3": 2.226481547255598e-06, "1": 0}, "score": 4.9983510822471855}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6260864552436618, "1": 0.36342802758626425, "4": 0.010118043134263129, "3": 0.00020532776540512635, "2": 0.00014139120583003652}, "score": 3.535304617525133}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7241009953393929, "5": 0.21716629120435907, "4": 0.056908958918874514, "3": 0.0009571561630912799, "2": 0.0008356255098217088}, "score": 2.042174258532118}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.772018056486243, "1": 0.22318117353364755, "3": 0.004760616987099941, "4": 3.885988785078397e-05, "5": 1.2934829715989293e-06}, "score": 1.78166104376056}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7872948107588194, "4": 0.16973526846849588, "2": 0.03694179178901025, "5": 0.005996082138218343, "1": 3.1668818649126565e-05}, "score": 3.1447223580275554}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.591772901516123, "5": 0.40265141762869133, "3": 0.005358967248407726, "2": 0.0001101105166195793, "1": 0.00010486161808825751}, "score": 4.396758335436341}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9959708207125821, "2": 0.0017490709810122802, "4": 0.001497758532706415, "3": 0.0004751464907009067, "5": 0.0003067538265378621}, "score": 1.0084196586509548}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7080198138614464, "3": 0.21499601197069937, "4": 0.07680261422652197, "5": 0.00014264300751186095, "1": 3.8819572214629794e-05}, "score": 2.3689903857995604}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.937803106305078, "4": 0.05618448656259332, "5": 0.0055551380761879685, "3": 0.0004529752815884192, "1": 4.17992606242133e-06}, "score": 2.1294831974507433}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.47177541137240026, "3": 0.33562409841815294, "2": 0.19018380114108246, "5": 0.0022193831102034676, "1": 0.00019715358769749564}, "score": 3.285636112798837}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8103904584451974, "5": 0.18186505917630907, "3": 0.00473071464572406, "2": 0.003012323111691636, "1": 1.2402866942881666e-06}, "score": 4.171106012409961}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9059362496858643, "4": 0.08018434360998976, "3": 0.012592599233628713, "5": 0.0011913901028069147, "1": 9.511075531620895e-05}, "score": 2.176440400105526}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8750027935509167, "3": 0.10071541626116719, "2": 0.01826591726822462, "5": 0.006011947738460702, "1": 3.535707985094324e-06}, "score": 3.8687540387000987}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6069121479171417, "3": 0.34766514133448, "2": 0.026482323666691933, "5": 0.018827626370392612, "1": 0.00011218188844101122}, "score": 3.617861070846461}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.840558539613684, "4": 0.15914796691216582, "3": 0.00029122831814290453, "2": 1.2947732172021703e-06, "1": 2.7348665765103216e-07}, "score": 4.840264486866205}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9989292964125687, "4": 0.0010696305184514044, "3": 9.128493275829727e-07, "1": 0, "2": 0}, "score": 4.998928543611225}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7819989821782602, "4": 0.21595051386992486, "1": 0.0011155865037881622, "3": 0.0008395148437057154, "2": 9.264792514806166e-05}, "score": 4.77762955409283}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6507024222230243, "4": 0.34825538618836593, "3": 0.00095716726616717, "2": 7.813511392864924e-05, "1": 0}, "score": 4.649593459913794}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6420091840632671, "2": 0.35764285580793764, "3": 0.0003456011131912723, "4": 2.113747752521887e-06, "5": 2.2737208964321105e-07}, "score": 1.3583413151787274}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8429194138784158, "1": 0.15675100311999224, "3": 0.000327077634785298, "4": 2.3392808614384913e-06, "5": 1.5554185150934695e-07}, "score": 1.843581218052776}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9743488024972978, "1": 0.017801153863374216, "3": 0.0077696613488422335, "4": 7.893901228755177e-05, "5": 1.4079131294015957e-06}, "score": 1.9901306089003996}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9581999343950334, "2": 0.041711350206807135, "3": 7.99112431358096e-05, "4": 4.730058441688881e-06, "5": 3.900522653850115e-06}, "score": 1.0419009722319355}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9646258847586711, "5": 0.03511411825133872, "4": 0.00022428051286363645, "3": 2.2382234868281094e-05, "2": 9.399820167390384e-06}, "score": 1.1411840343114334}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8239884056374481, "2": 0.17178297021251474, "3": 0.003726769151123292, "4": 0.00031016318368517196, "5": 0.00019159285200244966}, "score": 1.1809333873795784}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9941133672197705, "4": 0.0045409283747648525, "3": 0.0011806312805975538, "5": 0.0001631451928438267, "1": 1.8745067496563496e-06}, "score": 2.010750049676233}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9973644453884605, "4": 0.002630841294773836, "3": 3.8898148417057194e-06, "1": 0, "2": 0}, "score": 4.997361376902631}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5476902659198124, "4": 0.44217823127693284, "3": 0.009598017617587475, "2": 0.0005273007442464307, "1": 5.443441872577006e-06}, "score": 4.537021714420963}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7139927291198037, "4": 0.2827570303794165, "3": 0.0031080710076608294, "2": 0.0001355560974498936, "1": 4.6811347943612585e-06}, "score": 4.7106008755791295}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8975736919213657, "3": 0.09284598814805507, "5": 0.008636996361094378, "2": 0.0009414340124524089, "1": 1.6916350695119246e-06}, "score": 3.9139030482424486}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9953147223178717, "3": 0.0038928229128352624, "2": 0.0006732081428392265, "5": 9.947700957955962e-05, "1": 1.8379125887041285e-05}, "score": 3.994805093209933}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9944179922254458, "4": 0.0055184790007752, "3": 4.08821099558227e-05, "1": 1.983463313519274e-05, "2": 2.041830190709836e-06}, "score": 4.994314288377063}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9787301439841487, "4": 0.021173577901807804, "3": 6.46820389562943e-05, "2": 2.895901510008623e-05, "1": 9.174892258769877e-07}, "score": 4.978606474230394}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999238765575363, "4": 7.198894445314422e-05, "3": 1.5732391564643135e-07, "1": 0, "2": 0}, "score": 4.99992769612015}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6676769034000779, "5": 0.33003139258521036, "3": 0.002280545523367813, "2": 5.566478111327317e-06, "1": 0}, "score": 4.327741546840686}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7358548900132453, "5": 0.21846877081349225, "3": 0.032329233375713654, "2": 0.012447900560123053, "1": 0.0008988534960585702}, "score": 4.158547231596977}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.960278746240085, "4": 0.03962599249127273, "3": 9.399067337798278e-05, "2": 3.5440624395057154e-07, "1": 0}, "score": 4.960184926465106}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9675353047947921, "4": 0.03241664349367561, "3": 4.320739054135882e-05, "1": 2.4616049550545927e-06, "2": 1.2650056112802047e-06}, "score": 4.967483263944294}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9698585818699773, "4": 0.022076075795976296, "1": 0.007533104785802706, "3": 0.0003433086710094689, "2": 0.00018670196174498497}, "score": 4.946544662793041}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.712109462443437, "1": 0.2721968394401198, "4": 0.009488658838537103, "2": 0.003788189797412394, "3": 0.0024083420843938655}, "score": 3.8855332486298644}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6653101873074716, "3": 0.17012141346434326, "5": 0.09748367021303755, "2": 0.057399585324187666, "1": 0.009683670167669944}, "score": 3.7835117565968406}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5658623659778099, "4": 0.3450362827807687, "5": 0.07155323219969939, "3": 0.017547478756302155, "1": 0}, "score": 2.9222803314395867}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.34279153029085213, "3": 0.30420489740296447, "4": 0.2483065766771045, "5": 0.05834302877303106, "1": 0.04634871088399934}, "score": 2.929503311635692}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9937666501361192, "1": 0.0035890077767134414, "3": 0.002636544027264626, "4": 7.619727119470972e-06, "5": 5.533362866239623e-08}, "score": 1.9990629415904184}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7678134108308938, "5": 0.2217490149426633, "3": 0.010412291455219474, "2": 2.312620888093039e-05, "1": 0}, "score": 4.211290926731738}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7659793713167984, "4": 0.233698302745266, "3": 0.00030962334975106234, "2": 8.373923716283414e-06, "1": 0}, "score": 4.765656314388899}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7334675223652778, "3": 0.2487267188217213, "2": 0.01116491507587201, "5": 0.006630695356282378, "1": 9.721554736190075e-06}, "score": 3.735544868842253}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5426771299711634, "4": 0.44616591027642455, "2": 0.01050511077250177, "5": 0.0006458934537887777, "1": 5.470032500267756e-06}, "score": 3.436941858478985}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6316776262628747, "2": 0.21526455907124314, "5": 0.08212158384986859, "3": 0.05548680690008863, "1": 0.01544632141661056}, "score": 3.5497652977046066}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9294383221187219, "3": 0.06090591393694641, "4": 0.009479677332031564, "1": 0.0001022575425491567, "5": 7.380478434028314e-05}, "score": 2.079984427353936}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6776144436345097, "5": 0.22134486912308016, "3": 0.07573820926312262, "2": 0.025189375009031283, "1": 0.0001129300451978356}, "score": 4.094889136115011}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7850381057666292, "4": 0.12189250856033462, "5": 0.08769830561763889, "2": 0.005353908093403652, "1": 1.5719933519682278e-05}, "score": 3.2919041956883737}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7594345923573155, "4": 0.14734896410344045, "3": 0.05249762229653359, "5": 0.04071717033277004, "1": 9.945947193501969e-07}, "score": 2.4693463749461753}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9304640860913841, "2": 0.06771727240962065, "4": 0.0017019034122510452, "5": 0.0001145579785782163, "1": 1.7894200231990486e-06}, "score": 2.9342101424164233}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5495790815635695, "2": 0.2757539214268638, "3": 0.17411163587623302, "5": 0.0005500826600666774, "1": 5.014494195309166e-06}, "score": 3.2749153690403516}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9881410873181992, "2": 0.011836369815018545, "3": 2.1897611303286376e-05, "4": 4.663721110047467e-07, "5": 1.098909858811925e-07}, "score": 1.0118820045376693}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.746970377442804, "3": 0.1612441666136506, "4": 0.061276136635318806, "1": 0.016312824522459107, "5": 0.014195418603339068}, "score": 2.3100702048639525}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9647312672108854, "4": 0.021153758128160314, "1": 0.013123969340840005, "3": 0.0005438473266707887, "2": 0.0004410229248860272}, "score": 4.923939134441856}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9626921128220318, "1": 0.0320815365399578, "4": 0.005055108312166917, "3": 8.575089797168944e-05, "2": 7.639288457225771e-05}, "score": 4.866216847846538}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6598861558343848, "5": 0.33212313176963415, "3": 0.007959783324790784, "2": 3.0047442763156727e-05, "1": 0}, "score": 4.3241035392982115}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6461952475988574, "3": 0.3194167188560266, "2": 0.030220704803215294, "5": 0.0038069573678605312, "1": 0.0003601197294505878}, "score": 3.622868374813918}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9734112726045526, "4": 0.026502206110557616, "3": 8.596648903780257e-05, "2": 1.939881038740695e-07, "1": 0}, "score": 4.973325269322605}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7545482146746203, "5": 0.22737942070043188, "3": 0.017648596803170862, "2": 0.00041113069554116015, "1": 9.786535945918014e-06}, "score": 4.208879798329066}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8720869733208665, "4": 0.12690309693861088, "3": 0.000813060854039971, "2": 0.00015342065962044779, "1": 4.232671969736064e-05}, "score": 4.870841067642989}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8084223068548995, "5": 0.11609609797688293, "3": 0.04071300925059695, "2": 0.03476375353825995, "1": 0}, "score": 4.005855609946295}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9260819215986132, "1": 0.059086925841444246, "3": 0.014634412545888962, "4": 0.0001933909055682134, "5": 3.2943258790505923e-06}, "score": 1.9559441490797238}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9673567955199077, "2": 0.027987150076077716, "4": 0.004261591060713079, "5": 0.0003914921867297991, "1": 2.5360976921248584e-06}, "score": 2.977052343179129}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.8325606890706782, "3": 0.1499390501191975, "4": 0.014868788419606142, "5": 0.0026289212185536385, "1": 1.798533405308834e-06}, "score": 2.187561733246858}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6161470354617925, "5": 0.3582223843865349, "3": 0.02384399918034957, "2": 0.0017597220650281769, "1": 2.5264053065849475e-05}, "score": 4.330783676468346}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8848179511939044, "5": 0.11194318647554041, "3": 0.003082556480936146, "2": 0.00015488626261206043, "1": 0}, "score": 4.108551011566986}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9273605974888502, "4": 0.07226270642344046, "1": 0.00018192537180616457, "3": 0.00016619346440373953, "2": 2.735683915074108e-05}, "score": 4.926595045058762}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9951608585557765, "4": 0.004831721773475827, "3": 7.38398568069321e-06, "2": 2.150300809938941e-08, "1": 0}, "score": 4.9951534456774045}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8671631346345565, "4": 0.1326954534632435, "3": 0.00014033936961380187, "2": 4.915663065242285e-07, "1": 0}, "score": 4.86702231584306}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6445968347644467, "4": 0.35452472121396134, "3": 0.0008455662810263168, "1": 1.9469488696869626e-05, "2": 1.2782953914535226e-05}, "score": 4.643667696593595}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9980628900239892, "2": 0.0019363155746044017, "3": 7.312013284500983e-07, "5": 1.775914930540578e-08, "4": 1.1067720813461773e-08}, "score": 1.0019378822836322}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5440673688477775, "3": 0.2199522723564085, "4": 0.11651470392409051, "1": 0.11552332746724367, "5": 0.00394171252141484}, "score": 2.349283705070226}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7780362204804261, "5": 0.17591627629426274, "4": 0.03671474255820704, "2": 0.006829840216747203, "3": 0.002499780377417336}, "score": 1.8256413263972409}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8241046538812085, "5": 0.12086648165976666, "4": 0.04679474821423304, "2": 0.0053327224105151555, "3": 0.0028956142914002025}, "score": 1.6349777921564568}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8112738762207614, "4": 0.18367472218732692, "3": 0.0040394016678281545, "1": 0.0005103105989871554, "2": 0.0005001072412700871}, "score": 4.804704601383566}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9189923692313882, "2": 0.06996391289048891, "3": 0.009936193294747672, "5": 0.001105794718778647, "1": 9.31180221493403e-07}, "score": 3.851238863289193}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7481197501783384, "3": 0.238157133112578, "5": 0.011940025921979253, "2": 0.0017813670568147433, "1": 1.1878352798048592e-06}, "score": 3.770216472050086}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6155833402533516, "4": 0.3759276779390014, "3": 0.008474640885548567, "2": 9.318554852819246e-06, "1": 0}, "score": 4.607093111302654}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9726433419790061, "5": 0.014687570310372875, "4": 0.011666680738551535, "2": 0.0006532264530897844, "1": 0.0003476195233538431}, "score": 3.039693417820752}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5241486246759999, "4": 0.45905268195807863, "5": 0.015142795570995267, "2": 0.0016486574317703165, "1": 6.916698483099938e-06}, "score": 3.4876759401148063}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8483971122987161, "3": 0.07942238686728711, "5": 0.07097764575763683, "2": 0.001190350354076512, "1": 1.1298122460377155e-05}, "score": 3.9891406507119274}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4988851849430202, "4": 0.473836477966732, "1": 0.013331281671682996, "3": 0.010598137509004868, "2": 0.003342888584828837}, "score": 4.441610087859933}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.524384282442907, "2": 0.4704012147614559, "4": 0.00466408036110423, "1": 0.0005366170748690373, "5": 1.3750161341407374e-05}, "score": 2.5332171060069606}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7786421341491909, "3": 0.14213920282189824, "5": 0.06779410735371261, "2": 0.011152056038538975, "1": 0.00027122630819069823}, "score": 3.9025369894277384}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.952709561601842, "4": 0.04721706052017184, "3": 7.251566140885502e-05, "2": 3.4704895023115e-07, "1": 0}, "score": 4.952636842610194}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4862320985735912, "3": 0.3382826129078533, "4": 0.11844590743099906, "5": 0.03450919392042478, "1": 0.02252982481952183}, "score": 2.6561724224741132}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5384497508092999, "3": 0.20253618845140245, "4": 0.19381732252616435, "1": 0.053873304610501015, "5": 0.01132297648951601}, "score": 2.570266719038176}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7864140532108814, "4": 0.21112905445264268, "3": 0.002423555505277785, "2": 3.078912545411832e-05, "1": 2.2721500867004925e-06}, "score": 4.783922319018666}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2974403435460763, "5": 0.27348491883816084, "2": 0.21829127154205094, "1": 0.1598732444355543, "3": 0.050907791117387274}, "score": 3.30637316545558}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7796918199502445, "5": 0.1984729222497269, "4": 0.020201633732477377, "2": 0.0010842993076596405, "3": 0.000544378217460376}, "score": 1.8566738835126348}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8710595977137894, "1": 0.12548229576037526, "3": 0.003444977175285008, "4": 1.2948106457602408e-05, "5": 2.388364091315123e-07}, "score": 1.877989301163931}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6787920619026739, "2": 0.3209666356625748, "3": 0.00023984708104714768, "4": 1.2557619978899549e-06, "5": 1.446249495884443e-07}, "score": 1.3214506932795629}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6516261963154393, "4": 0.3383120786066501, "3": 0.01004111615581171, "2": 1.9409809021744474e-05, "1": 0}, "score": 4.641547029829018}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957162863879642, "4": 0.0042748212086757, "3": 8.414652722821515e-06, "2": 2.815688040138588e-07, "1": 0}, "score": 4.995707503937356}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9873796105559117, "3": 0.011456153153582367, "4": 0.0011533609889612109, "1": 8.182629534673125e-06, "5": 2.601584176057865e-06}, "score": 2.0137624985080946}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6772815186053686, "1": 0.31942639732923617, "3": 0.0032158084210784405, "4": 7.46765079918784e-05, "5": 1.5830930468290093e-06}, "score": 1.683943508316384}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8456035129900151, "3": 0.14416603828565955, "4": 0.009526317950830669, "1": 0.0006116512443856664, "5": 9.230271517877487e-05}, "score": 2.1628839598886245}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982682490141416, "4": 0.001721248120260753, "3": 9.716782624463903e-06, "1": 1.5287304977675075e-07, "2": 0}, "score": 4.998258705719685}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5001938778588828, "4": 0.4513999163098617, "5": 0.030813329704880727, "2": 0.01757949171197554, "1": 1.2765389431252325e-05}, "score": 3.495421859907286}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8446942934361412, "5": 0.11211225868236548, "3": 0.04312957596182898, "2": 6.229514902311499e-05, "1": 0}, "score": 4.068858200996079}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8334344284599344, "4": 0.11949099094907453, "3": 0.03909238062132783, "5": 0.007975280169153234, "1": 6.814533139531364e-06}, "score": 2.3019934202838503}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6210912546113943, "1": 0.37767350499624214, "4": 0.001083623241034746, "2": 7.984933591452626e-05, "3": 4.8433104537526485e-05}, "score": 3.487850656989457}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9910212697165312, "1": 0.005918454075993648, "4": 0.0029579110090021256, "3": 6.246182424022877e-05, "2": 3.743314560144436e-05}, "score": 4.973130983229123}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9437777763103354, "5": 0.05551853222514684, "2": 0.0005343101940072385, "4": 0.0001480195793566148, "3": 1.8709540070413646e-05}, "score": 1.2230905085825392}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.5642443368116945, "5": 0.43301080390897073, "4": 0.002145593660698691, "2": 0.00040538736142487164, "3": 0.0001542833054264376}, "score": 2.739262816617622}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.937951478492426, "4": 0.03944312176987062, "2": 0.022574715098053193, "5": 2.641794615918287e-05, "1": 4.2736127977020385e-06}, "score": 3.0169126952215164}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9768890356517036, "2": 0.02302379575125193, "3": 8.33480787019129e-05, "4": 3.56937160026932e-06, "5": 1.868331246597307e-07}, "score": 1.0232019488481565}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5746512752459438, "4": 0.3880068984525639, "1": 0.015956235271980847, "3": 0.01382636503139168, "2": 0.0075581381165684474}, "score": 4.497840469756935}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9878058555728857, "3": 0.006415459849547777, "4": 0.005767872407480294, "5": 1.0253617375055695e-05, "1": 5.059504992568529e-07}, "score": 2.0179814605119986}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.822312266344936, "5": 0.15498013989219184, "3": 0.022444380678008878, "2": 0.000262460227945594, "1": 0}, "score": 4.1320109381436385}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9279735442069423, "2": 0.06482535313887092, "3": 0.005196676460212879, "4": 0.0017043300125323493, "5": 0.00029977181181952957}, "score": 1.0815308097902896}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.70204109274201, "4": 0.2939532611387417, "3": 0.003814066256635607, "2": 0.00018329072582626605, "1": 5.658413530521631e-06}, "score": 4.697845305631005}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9653386659890214, "4": 0.03228024647747596, "3": 0.0012614116853291051, "2": 0.0009651253197800288, "1": 0.00015366924884705285}, "score": 4.9616868434325365}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8446742997588417, "4": 0.13138478120460706, "3": 0.02375981905611657, "2": 0.0001780762016719366, "1": 0}, "score": 4.820560809493729}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9516597676414033, "2": 0.047553542130984595, "4": 0.0005784950893255614, "5": 0.00020542881152101178, "1": 2.251047262581478e-06}, "score": 2.953431284490953}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6511049215137719, "3": 0.30728574463623987, "4": 0.023926907894879952, "1": 0.017623430216163194, "5": 5.863164441797559e-05}, "score": 2.3376921480949537}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6239676593004372, "2": 0.37486200777476647, "3": 0.001155388070114198, "4": 1.4256380458310532e-05, "5": 4.840299751593878e-07}, "score": 1.377217566296232}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8380065686887895, "3": 0.13255041703570952, "2": 0.028866740336856957, "5": 0.0005743911199769028, "1": 1.6598256354472365e-06}, "score": 3.810285471628629}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9371818113255111, "5": 0.05749443031255174, "4": 0.004914690489503236, "1": 0.0002943776768210341, "3": 0.00010965987805687271}, "score": 2.1821288702839508}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8437294859829984, "3": 0.15584937235727991, "5": 0.0003793404011174, "2": 3.8576452750862955e-05, "1": 0}, "score": 3.844452313527246}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9195503577391781, "1": 0.07498537383478715, "3": 0.0054602374563336225, "4": 3.821383607532396e-06, "5": 7.418498987698673e-08}, "score": 1.9304827195310144}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7912004815827264, "4": 0.1140576222449064, "2": 0.09398458495503409, "5": 0.0006952713895911238, "1": 6.139488699350768e-05}, "score": 3.021340804058622}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8830571481771791, "5": 0.04825378541874549, "3": 0.032148856390137245, "2": 0.02782490488931876, "1": 0.008710654042060473}, "score": 3.93432285165395}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6690691439561776, "3": 0.17926532644099874, "1": 0.13417622917196978, "4": 0.017242534703304765, "5": 0.00024639145654964715}, "score": 2.080313371104253}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7827278475300906, "4": 0.2116026194121881, "3": 0.0056530073561914095, "2": 2.1415107929537446e-06, "1": 0}, "score": 4.777081734844206}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5985561143899221, "5": 0.24173891472299286, "3": 0.13608050770107483, "2": 0.023136449606390382, "1": 0.0004873082881248313}, "score": 4.057923623797802}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5105836172404578, "4": 0.3344212677711041, "1": 0.10339159566983698, "3": 0.033052436294012576, "2": 0.01855010740348818}, "score": 4.130256306210758}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.561812620592234, "3": 0.26700414402752276, "2": 0.1449203207018312, "1": 0.01569381489470661, "5": 0.010568250588872946}, "score": 3.4066415165966104}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971472488499004, "4": 0.002843054149184308, "3": 5.525007240851276e-06, "1": 2.3611494557017927e-06, "2": 1.031327242793248e-06}, "score": 4.997133355022184}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5426385415724778, "5": 0.4529800247255168, "3": 0.004234144408407512, "2": 0.00014358548296772013, "1": 3.544246405950394e-06}, "score": 4.448448148168237}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9881125645433072, "2": 0.011880771809836006, "3": 6.181120452095434e-06, "4": 2.556342819504398e-07, "5": 6.152483023241236e-08}, "score": 1.0118941490198101}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8454436329380798, "3": 0.1345531487502739, "1": 0.010700187653048242, "4": 0.00898314082521495, "5": 0.0003197580314231911}, "score": 2.1427785356604163}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5660441501627392, "3": 0.25860729589275433, "4": 0.13067488949906506, "1": 0.043803765279900875, "5": 0.0008692737196146944}, "score": 2.4787614302092136}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9865993569170632, "2": 0.011355981153273402, "3": 0.001772355191882064, "4": 0.00021829657149627195, "5": 5.319559318053653e-05}, "score": 1.015768376468744}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.353472602565439, "1": 0.26986242145911055, "2": 0.18776620133442246, "4": 0.14478373973265846, "3": 0.04410696378670816}, "score": 3.1242389033581968}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7061938811480288, "5": 0.2844185380956475, "3": 0.009353022742125154, "2": 3.36448351844494e-05, "1": 0}, "score": 4.274998476805992}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6741156467994308, "4": 0.3254889713788991, "3": 0.00039284108175505867, "2": 1.0595990246900365e-06, "1": 0}, "score": 4.673721684396361}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9738460123906344, "4": 0.02606929744999401, "3": 8.411816680373204e-05, "2": 1.8936224804615972e-07, "1": 0}, "score": 4.9737618880901575}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7448995514212854, "5": 0.23769218089582747, "3": 0.01700180098913279, "2": 0.0003933207976743468, "1": 1.0116831864348997e-05}, "score": 4.219874053828381}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7513652228887014, "4": 0.24643825590981802, "3": 0.002193119542693303, "2": 1.0923240233239322e-06, "1": 0}, "score": 4.749171648786093}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.45368280160803137, "4": 0.3319030734932661, "1": 0.18006371833173546, "3": 0.018038087218245107, "2": 0.01631116722367983}, "score": 3.862831066911457}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.699441052035141, "4": 0.2396755608447284, "2": 0.055426109812476934, "5": 0.005426971692303845, "1": 3.0167692227881852e-05}, "score": 3.1950430859333543}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5001287568554549, "2": 0.4474975124739978, "4": 0.05043992272019969, "1": 0.0017258372222660793, "5": 0.00020787242661721823}, "score": 2.5999064413251216}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6589260936566558, "3": 0.28786236856431613, "4": 0.05287915833893698, "5": 0.00033098218691569826, "1": 1.2439223316019148e-06}, "score": 2.3946124483868654}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8834509116497332, "4": 0.046914602408325165, "5": 0.041464501638434376, "2": 0.024707832014547803, "3": 0.003459725597978831}, "score": 1.3382299177687094}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.48640551985911995, "2": 0.3035892932674529, "4": 0.20837765427914684, "5": 0.000826125053015464, "1": 0.0008012472354754463}, "score": 2.904838101391771}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9428414585806485, "1": 0.03923619564217251, "3": 0.01730343227080774, "4": 0.0006111433566773212, "5": 7.621216921746258e-06}, "score": 1.9793123839116906}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.870082120855675, "1": 0.08683242214878176, "3": 0.03847972883950003, "4": 0.004487678270231115, "5": 0.00011806006943721382}, "score": 1.9609768438368893}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8979545539805897, "4": 0.10149451716887117, "2": 0.00031471502850924637, "3": 0.0001969725852652874, "1": 3.851314293463941e-05}, "score": 4.897013265019326}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8559247975749622, "5": 0.1201355368290579, "4": 0.021610263826503284, "2": 0.001891971257621159, "3": 0.0004342435526699611}, "score": 1.5481351440430346}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"1": 0.955809087634838, "2": 0.044174211959325485, "3": 1.648020655309341e-05, "4": 1.8051752003103845e-07, "5": 1.6220174986507207e-08}, "score": 1.0442077798428764}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9869398003124651, "1": 0.010312299189956459, "3": 0.0026520615447725186, "4": 9.338330276160448e-05, "5": 2.3847601612532254e-06}, "score": 1.9925336827115365}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.787268342352218, "1": 0.21245452787215846, "3": 0.0002756727731944306, "4": 1.3472258576752368e-06, "5": 1.247939324976824e-07}, "score": 1.7878242169208696}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5375423668715564, "3": 0.3112053485401243, "2": 0.14322129892583707, "5": 0.007746496518165373, "1": 0.00028377922468149493}, "score": 3.4092467930650217}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6169086630435074, "4": 0.37394570720745096, "3": 0.008069452038975645, "2": 0.0007013358390438575, "1": 0.00037243687410332073}, "score": 4.606320686903517}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7471942929586342, "1": 0.2441213112467039, "3": 0.008547569546596292, "4": 0.00012934853179945733, "5": 7.271917834784104e-06}, "score": 1.7647067226940083}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6425013506731194, "2": 0.35684955520996914, "3": 0.0006409276358539455, "4": 6.523372898933821e-06, "5": 1.5793739873113164e-06}, "score": 1.358157320923183}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7553709695566782, "3": 0.22379547550448084, "4": 0.012725842633439958, "1": 0.006160979526721141, "5": 0.0019465227564966637}, "score": 2.2489258017940696}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9833571679666294, "5": 0.016495185970653102, "3": 0.00013939959011411896, "2": 7.773002858258484e-06, "1": 0}, "score": 4.016340248111435}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9954027046624324, "5": 0.003215334124316578, "2": 0.0012869614554010065, "3": 6.281673745601682e-05, "4": 3.1757266267209766e-05}, "score": 1.014369209344131}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9856844608682852, "2": 0.014308056625243466, "3": 6.990667588890132e-06, "5": 1.8104431525227748e-07, "4": 1.5780764220781467e-07}, "score": 1.014323237751877}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.658480072642035, "3": 0.21558950914788158, "4": 0.12138980287159169, "5": 0.0031083550983336773, "1": 0.0014322638136532238}, "score": 2.4662619147062284}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8339032587951692, "3": 0.11754735562448074, "5": 0.04458659614460953, "2": 0.0039529252679273985, "1": 9.358954241987563e-06}, "score": 3.9191052722524335}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9881701830667975, "4": 0.01181483894307342, "3": 1.4273469836593292e-05, "1": 0, "2": 0}, "score": 4.988156605773342}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.47195213850996315, "4": 0.2587362437673444, "2": 0.1364508230453841, "5": 0.08030792263057164, "3": 0.052548611734527656}, "score": 2.338994172871981}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.998998535101024, "4": 0.0009980581667845163, "3": 2.642217582584101e-06, "1": 3.3784994153446347e-07, "2": 2.105509858686739e-07}, "score": 4.9989946741280615}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999759659438225, "4": 2.2859746246209743e-05, "3": 4.1777409211615467e-07, "1": 0, "2": 0}, "score": 4.999976304687644}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983951375711873, "4": 0.0011092518499035973, "1": 0.00046280377768740955, "3": 2.64391418503386e-05, "2": 5.954359009460278e-06}, "score": 4.996968790425818}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9981210822800872, "2": 0.001468889361716684, "4": 0.00040525461880179596, "5": 4.618308709911695e-06, "1": 0}, "score": 2.9989456017106195}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9944474633332073, "1": 0.00534520971254387, "4": 0.00020238029135913893, "3": 2.6098286242300623e-06, "2": 9.775836238991913e-07}, "score": 4.97840859910222}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5941969196476312, "5": 0.3836262529374992, "3": 0.01631684939271613, "2": 0.005856830453282941, "1": 2.9362185851508717e-06}, "score": 4.355587009135878}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9347752153381053, "1": 0.03505780178900124, "4": 0.029808097326942423, "2": 0.00017962773275741572, "3": 0.0001744242513937471}, "score": 4.829072137625607}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9599984078607652, "4": 0.03991742634231776, "3": 8.021010929305267e-05, "2": 2.086529288228296e-06, "1": 0}, "score": 4.959915818927551}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8447743489076988, "4": 0.14273116258917867, "1": 0.01112530317072522, "3": 0.0008374223625457561, "2": 0.000528931830102815}, "score": 4.809505445195815}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995797824361426, "4": 0.0003848393051609278, "1": 3.173421885912121e-05, "3": 2.541388430750063e-06, "2": 5.223369287010641e-07}, "score": 4.999481573730905}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9285899557561412, "2": 0.07102489710202944, "3": 0.0003772776007389573, "4": 7.386925091898159e-06, "5": 4.198677735994213e-07}, "score": 1.071803297055407}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7728789425253492, "1": 0.21468664051436948, "3": 0.011417325460928305, "4": 0.0010082380263066344, "5": 7.818905303271865e-06}, "score": 1.7987704095294386}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9779511627818822, "2": 0.022034245990365114, "3": 1.4321008112386343e-05, "4": 1.0488010461690489e-07, "5": 4.858742909962026e-08}, "score": 1.0220633995725688}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.7450093875080642, "4": 0.16446794351763389, "2": 0.08886470805853179, "5": 0.001655242756905559, "1": 1.7899014419332048e-06}, "score": 3.0789102144190217}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7628166332305252, "1": 0.23584577107096674, "3": 0.0006812565481974917, "4": 0.0006478761541607998, "5": 8.358596731839664e-06}, "score": 1.7661562891626006}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9071541022921307, "1": 0.08973172441829348, "3": 0.0030799109338375073, "4": 3.36538532086401e-05, "5": 5.502863818287541e-07}, "score": 1.9134171400405864}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9066339713694446, "1": 0.09281266242063592, "3": 0.0005506100569416715, "4": 2.635796881156234e-06, "5": 2.8660212501687207e-08}, "score": 1.9077432967511454}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7436658510266875, "5": 0.24438654656203784, "3": 0.011646592861325553, "2": 0.0002832530189104949, "1": 1.7341067944735167e-05}, "score": 4.232121520896983}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7624286565945203, "3": 0.16618062163821692, "4": 0.06736996389033431, "1": 0.0030583277479336655, "5": 0.0009604659756159618}, "score": 2.300744210305557}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5881349209540425, "5": 0.3993343072984787, "3": 0.012370347510067858, "2": 0.00014300513775401783, "1": 0}, "score": 4.3866846852119705}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9016014572181016, "2": 0.0979616209475555, "3": 0.0004191238906521476, "4": 1.3542793461223478e-05, "5": 4.004679522485914e-06}, "score": 1.0988565405880013}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8151230952741821, "2": 0.18480122333838653, "3": 7.502388713525793e-05, "4": 5.891429401323971e-07, "5": 1.0090321972868294e-07}, "score": 1.184953436134887}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7642772446310127, "1": 0.2326037306774934, "3": 0.0030768036402557945, "4": 3.403136359075215e-05, "5": 8.164876150478474e-06}, "score": 1.7705656246257853}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7216655316400814, "5": 0.23259051916080153, "2": 0.03076641518531277, "4": 0.011159133147511434, "3": 0.0038109015139441544}, "score": 2.0022352104139207}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8907413548644355, "1": 0.10571416328021857, "3": 0.0035004130610759806, "4": 4.247372111426013e-05, "5": 1.397656014312152e-06}, "score": 1.8978753700299764}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"2": 0.590883975381857, "1": 0.40756705813467975, "3": 0.0015209132533110677, "4": 2.6960789182518115e-05, "5": 9.760265968829065e-07}, "score": 1.5940106575137925}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8021881641446846, "2": 0.19770447771956765, "3": 0.00010675660865463401, "4": 5.858816677076281e-07, "5": 1.1427020200528916e-07}, "score": 1.1979201861428537}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7974886949778305, "4": 0.2006094090535898, "3": 0.0018244919760267847, "2": 5.702635662912958e-05, "1": 1.2588938832465524e-05}, "score": 4.795518579525296}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9990374324656285, "2": 0.0006203544188155581, "5": 0.00020443192969897648, "4": 7.992363033847915e-05, "3": 5.628694119941929e-05}, "score": 1.0017904297231004}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8209397157972668, "3": 0.1482022031753826, "1": 0.02311668795456991, "4": 0.0076625948448650035, "5": 7.832670132567266e-05}, "score": 2.1406457513327317}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"2": 0.921859143382984, "1": 0.06397427049315811, "3": 0.013857776829473941, "4": 0.0002943401460598764, "5": 1.4364121830225348e-05}, "score": 1.9505152737967189}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5423359150800041, "5": 0.44948879638379796, "3": 0.008072129120186348, "2": 9.866976408970529e-05, "1": 2.372915951040263e-06}, "score": 4.44121314291931}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6960566209617994, "4": 0.25969287401116675, "3": 0.044242429805742875, "2": 4.1405290021206086e-06, "1": 0}, "score": 4.651808474763832}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7962455984184178, "5": 0.2015629377926221, "3": 0.002183823586006621, "2": 6.543338818899964e-06, "1": 0}, "score": 4.199366246206663}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7295120813636166, "4": 0.26879716964045014, "3": 0.0012912304216095905, "1": 0.0002598286974633177, "2": 0.00013772756372040285}, "score": 4.727167336652196}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8603387258607481, "1": 0.10159465027476519, "3": 0.03512169318357261, "4": 0.002911266701207118, "5": 3.2918919654283356e-05}, "score": 1.9394482879555226}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9267546086940724, "3": 0.043060765917009, "1": 0.029009828285932602, "4": 0.001164819196670039, "5": 9.954558211364236e-06}, "score": 2.016410440082203}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8126977416910518, "4": 0.13992368669875777, "3": 0.04248630033818329, "2": 0.004890430219096384, "1": 1.302161476472101e-06}, "score": 4.760427084217889}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9888250518409355, "2": 0.008656913748561439, "4": 0.0012117702160832368, "5": 0.0009330693777694293, "3": 0.00037265518607070453}, "score": 1.0167698213295389}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6447158963482629, "2": 0.34828673058359955, "3": 0.0066251915123707854, "4": 0.0003550477395232035, "5": 1.699794676044089e-05}, "score": 1.3626702978897782}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8923448606856981, "2": 0.10756545854836615, "3": 8.90462197499969e-05, "4": 4.43270342092262e-07, "5": 7.442529249414194e-08}, "score": 1.1077451910901475}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7608262235168579, "4": 0.23812855597126728, "3": 0.0010054812463445913, "2": 3.4313317974955545e-05, "1": 4.899982128986286e-06}, "score": 4.759737815284001}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997397708854714, "4": 0.0002582214520313576, "3": 9.404399869219007e-07, "1": 0, "2": 0}, "score": 4.999739897390408}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9434067096091657, "4": 0.05646502833451132, "3": 7.334486959450636e-05, "1": 5.1732569697197036e-05, "2": 2.5088752821650437e-06}, "score": 4.943173786621821}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7555397533928369, "5": 0.2414057865042875, "3": 0.002982979338171492, "2": 5.693154367795136e-05, "1": 1.3775360950024902e-05}, "score": 4.23826780238185}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.965332886523729, "4": 0.03463955991156854, "3": 2.725798642440053e-05, "2": 9.7476160161933e-08, "1": 0}, "score": 4.965305624814073}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.599856601398291, "2": 0.38774740476904335, "3": 0.009037271277300758, "4": 0.0030964050552911627, "5": 0.0002621285567306766}, "score": 1.4161597553470564}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9275876477903091, "4": 0.07126084933906646, "3": 0.00111746628718358, "2": 3.354455509391881e-05, "1": 0}, "score": 4.926403548209743}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4845981927359903, "3": 0.3512723255743619, "2": 0.1527522272533612, "5": 0.010917535728718727, "1": 0.00045943274155233534}, "score": 3.3527622723349833}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5257983735382017, "4": 0.2994035050953018, "5": 0.16631608078729085, "3": 0.008472581798002646, "1": 8.61336923135236e-06}, "score": 3.106220156193011}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9981043355458125, "3": 0.0015751464923719318, "4": 0.00022608579654577167, "1": 9.389438229538081e-05, "5": 4.5336785456859727e-07}, "score": 2.0019347839700568}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9998417658603422, "3": 7.622119380651363e-05, "1": 7.471505101324648e-05, "4": 6.632776918853952e-06, "5": 5.901181888637435e-07}, "score": 2.000016542052439}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9950365617711504, "3": 0.003870239064793199, "1": 0.000758307941154355, "4": 0.0003224820765055073, "5": 1.23518772795599e-05}, "score": 2.0037939511257643}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5952045208368982, "1": 0.2912087543780666, "3": 0.058430112326862654, "5": 0.03152970063747669, "2": 0.02362488200764971}, "score": 3.0522216373482296}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8789982783017141, "4": 0.1196900612928886, "5": 0.0008391014005331194, "2": 0.00047206965930252337, "1": 0}, "score": 3.1208962535946974}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4708380627035462, "2": 0.16523116261511792, "5": 0.15397420355236527, "3": 0.15022331880570064, "1": 0.059730553833338744}, "score": 3.4940955328383017}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4268459942559929, "2": 0.36172786645011373, "3": 0.1981931338934263, "5": 0.013209302007957759, "1": 2.3540328529643165e-05}, "score": 3.091489666083404}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4821685679664364, "2": 0.3110870818651497, "5": 0.15058574843499029, "3": 0.055340376569137796, "1": 0.0008181155272309932}, "score": 3.470616803513846}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9971650343262726, "4": 0.0010788901555215038, "3": 0.001058062895257102, "5": 0.0006962916138242844, "1": 1.6394733430315828e-06}, "score": 2.0053030790068203}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.989527359993401, "5": 0.008318910352280173, "4": 0.0019772901159715926, "3": 0.00017542657125822417, "1": 9.042707673472398e-07}, "score": 2.0290858367507982}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8084532215149981, "1": 0.1301162496543411, "3": 0.05886900251175438, "4": 0.002500306386542963, "5": 6.104367294761333e-05}, "score": 1.9339364850050256}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.554934749841776, "5": 0.4386112208466068, "3": 0.006170967168165569, "2": 0.00017739299072542806, "1": 0.0001032281469851512}, "score": 4.431776837225773}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9798794843819879, "4": 0.018538061166760177, "1": 0.0010141038123602727, "3": 0.000290304553952569, "2": 0.0002765015862855714}, "score": 4.975995372641924}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9176976499175437, "4": 0.05749334942742222, "1": 0.02451171775633698, "3": 0.000217289281007903, "2": 7.446815303596497e-05}, "score": 4.843800933453685}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.5999365376160596, "5": 0.3488416446530871, "4": 0.047418681663840154, "2": 0.002129136032693448, "3": 0.001669585311259877}, "score": 2.5430977426082704}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8835427546794452, "3": 0.08485865406386117, "1": 0.02185853097503222, "4": 0.00969324526965393, "5": 4.670744425988278e-05}, "score": 2.082526744838132}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7200207989202735, "5": 0.24279216249316038, "2": 0.021894723659010424, "3": 0.015183980824359662, "1": 0.00010603630738496259}, "score": 4.183501047076563}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7092343436869902, "3": 0.22624174121171417, "2": 0.062098577307948884, "5": 0.002367650892458673, "1": 5.767810033976646e-05}, "score": 3.651755717699087}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.47367592199209574, "2": 0.3051923943800921, "1": 0.11067765627215384, "5": 0.06078509306034891, "3": 0.04966635186566878}, "score": 3.0686985785976386}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7425938269694558, "5": 0.14244305117903436, "2": 0.09428963599458673, "3": 0.020666870908182425, "1": 6.196450065343348e-06}, "score": 3.9331782909666853}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9057508778596207, "1": 0.09163257942126474, "3": 0.002603559322364035, "4": 1.2581953909908827e-05, "5": 3.030166749842438e-07}, "score": 1.910997044098724}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6149237761970288, "4": 0.3172464380599748, "2": 0.06726204962301369, "5": 0.0005668867554625428, "1": 5.521257547718004e-07}, "score": 3.2511171323381234}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9637920012410087, "3": 0.02234334198646964, "1": 0.01380172078537929, "4": 6.252056595929731e-05, "5": 3.0891520969049393e-07}, "score": 2.0086675900017883}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4711035112514754, "4": 0.46754078192214515, "2": 0.057951553613755494, "5": 0.003197452116233348, "1": 0.00020568041033337516}, "score": 3.4155731958899564}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5926542513643188, "3": 0.4000534563213167, "2": 0.005582255906337035, "5": 0.0017038918856097569, "1": 5.831233511293666e-06}, "score": 3.5904683017493473}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7018216268848386, "1": 0.2890043323938178, "3": 0.008815257076759815, "4": 0.00033245036074694694, "5": 2.610522688219731e-05}, "score": 1.7205540773554968}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7253808149712239, "4": 0.264871996968548, "1": 0.007078581814694053, "3": 0.002208974938030213, "2": 0.0004555687133781469}, "score": 4.701027805153799}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7190479166633197, "4": 0.27854161647180253, "3": 0.0019150860933445524, "2": 0.00032046259393696784, "1": 0.00015664099923826715}, "score": 4.716035069485061}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.640146027939154, "5": 0.35526208297023215, "3": 0.004573884203252997, "2": 1.534932590314385e-05, "1": 0}, "score": 4.350658431310187}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8943198622926767, "5": 0.10461299498809727, "4": 0.0009980342136759522, "3": 4.944804675841197e-05, "2": 1.766136627969312e-05}, "score": 1.4215634827976151}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9599389790788775, "3": 0.03390344321464672, "4": 0.005939759111793615, "1": 0.00017206986014142457, "5": 4.565346729131879e-05}, "score": 2.0457478563382385}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9999784691637917, "2": 2.139832307474662e-05, "3": 3.5307020915264885e-08, "5": 8.361274243445507e-09, "4": 0}, "score": 1.000021502384124}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9764793146928591, "4": 0.01739267218949781, "3": 0.0059129329596342315, "5": 0.0002062369102949692, "1": 8.709283780888597e-06}, "score": 2.0413082843195536}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8866014191562075, "3": 0.08648810404440585, "2": 0.01745354498435782, "5": 0.009456137286215322, "1": 5.841435964561865e-07}, "score": 3.8880591672916083}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9001210497318902, "4": 0.06216475995511735, "3": 0.03717511474586735, "5": 0.000537232820331462, "1": 1.8253916339620496e-06}, "score": 2.163114510556341}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.713990729942961, "1": 0.26244015602205933, "3": 0.022437500285711037, "4": 0.0009828475856913696, "5": 0.00014865356890936496}, "score": 1.7624089733902797}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.684071099584987, "5": 0.3038536220353628, "3": 0.011812889655468464, "2": 0.00024785268509694723, "1": 1.3416262063235704e-05}, "score": 4.291505104644228}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.42018765494538, "3": 0.3861275359782448, "4": 0.1563844156527091, "1": 0.031482167643654954, "5": 0.005817931458017052}, "score": 2.684868195585832}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5335712314010992, "4": 0.45716481847018775, "2": 0.006971866496711665, "5": 0.0022849000440295112, "1": 0}, "score": 3.4547660189132388}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9883208381298599, "4": 0.011658322224097656, "3": 2.0115276634697357e-05, "2": 1.291814282661662e-07, "1": 0}, "score": 4.988301052715275}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5291357837520195, "3": 0.3923437932324301, "4": 0.07825696843848026, "5": 0.0002499471656092392, "1": 1.33042902442098e-05}, "score": 2.5495943789502524}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.542275719134367, "4": 0.4500960385447639, "3": 0.007618713923282854, "2": 8.617918291152626e-06, "1": 2.135390749886317e-07}, "score": 4.534639501369049}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8929853889478673, "3": 0.06188322114063232, "5": 0.04406637760053402, "2": 0.0010637285955194295, "1": 9.201804912536862e-07}, "score": 3.9800529314759325}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9635547516026456, "5": 0.03642383175609883, "3": 4.217930301954494e-06, "1": 0, "2": 0}, "score": 4.036420240206981}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.698951936139613, "4": 0.3004824588265538, "3": 0.0005615788310288833, "2": 2.3497913993081855e-06, "1": 0}, "score": 4.69838682850943}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9393091600810446, "2": 0.06059244885645544, "3": 9.423272853941201e-05, "4": 2.8131660519491337e-06, "5": 1.2364032476418652e-06}, "score": 1.0607943060369527}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.8566055883060507, "4": 0.11901316044626863, "2": 0.01713710642630027, "5": 0.0072273416043788915, "1": 1.4897844796575856e-05}, "score": 3.116301163136137}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3614085655793021, "3": 0.2284323896905386, "2": 0.22413632914543935, "5": 0.18585702196174694, "1": 0.00016238232051283774}, "score": 3.5086632000540376}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6644363312111562, "5": 0.18269960091022264, "4": 0.13479596691226411, "3": 0.018022242310469918, "1": 4.2062582045481736e-05}, "score": 2.835674088564168}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5911274106233629, "5": 0.3716833674212012, "3": 0.03629263684579975, "2": 0.0008845978703546438, "1": 8.158232645565314e-06}, "score": 4.333598337487004}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7587717131623226, "3": 0.14314662849045554, "1": 0.07880227594378919, "4": 0.019093916548066178, "5": 0.00018510394977717145}, "score": 2.103087534800085}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8028923851651047, "1": 0.16307018304763743, "3": 0.03114018411816982, "4": 0.0028605662049095326, "5": 3.59562728802207e-05}, "score": 1.8738989108515796}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.986265647791132, "4": 0.013556908624567323, "3": 0.0001767290127470162, "2": 2.2882919158050164e-07, "1": 0}, "score": 4.986088940105172}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9999762043451211, "3": 1.7157434152448687e-05, "4": 3.7011277035806676e-06, "1": 2.484634479447953e-06, "5": 2.203959798674148e-07}, "score": 2.000022736248296}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8567241421565608, "3": 0.08115800868465985, "5": 0.06150363501385557, "2": 0.0006111977508565706, "1": 0}, "score": 3.9791231678547296}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.848407327061441, "4": 0.14525229253517122, "3": 0.006182037928369168, "2": 0.00015545954825911193, "1": 2.6120009051889895e-06}, "score": 4.841906762128148}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995269016763211, "4": 0.00044610495879934814, "1": 2.1585257488069045e-05, "3": 2.7876015258826135e-06, "2": 0}, "score": 4.999461977398306}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6473366792778514, "5": 0.260387909556557, "3": 0.09145792943783684, "2": 0.0008153627921729634, "1": 1.536824935538499e-06}, "score": 4.167294741443618}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5324768800966521, "4": 0.45565492471003977, "3": 0.01158910090157297, "2": 0.0002765123700577185, "1": 2.147242708595721e-06}, "score": 4.52032853890271}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9968533840057611, "4": 0.003141081850581339, "3": 3.718348276407589e-06, "1": 0, "2": 0}, "score": 4.996851475735791}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7748862923047024, "4": 0.2248425049222769, "3": 0.00026850393194691245, "2": 2.4349264675916624e-06, "1": 0}, "score": 4.774613122951538}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9936954178062919, "4": 0.006301888050042096, "3": 1.8345781387997235e-06, "1": 0, "2": 0}, "score": 4.9936944373736365}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998585673825358, "4": 0.00013902441399565724, "3": 1.787647586343575e-06, "1": 0, "2": 0}, "score": 4.999857400202342}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6966741159481614, "5": 0.25339123532307906, "4": 0.04414177349932527, "2": 0.004970787503585733, "3": 0.0008186253720046147}, "score": 2.152602290754859}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9978296152983498, "4": 0.0021675712020479718, "1": 0, "2": 0, "3": 0}, "score": 4.997832422699474}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"1": 0.39009686457196274, "4": 0.30272490202055913, "5": 0.12485736165473368, "3": 0.10298653782734205, "2": 0.07933086562736305}, "score": 2.692913965492847}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4687338995097247, "2": 0.23304563178981602, "3": 0.18677087140672002, "5": 0.06679416183089731, "1": 0.044653999553723095}, "score": 3.2799689942842893}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4526057461477259, "5": 0.24844256175035215, "2": 0.2479384125871171, "3": 0.04233061905746574, "1": 0.00867729877308957}, "score": 3.6842015279876907}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7302359630607693, "1": 0.26050875758116476, "4": 0.009138856598261934, "3": 6.812457796562869e-05, "2": 4.3936506513766816e-05}, "score": 3.948553468333213}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9028821441270348, "4": 0.08169311928015299, "3": 0.01026703091054726, "5": 0.00514877220255962, "1": 8.425143914769423e-06}, "score": 2.189091257056471}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8971996826927905, "3": 0.06664468369865924, "5": 0.03567185416092525, "2": 0.0004829168849346293, "1": 6.730622602937546e-07}, "score": 3.968059311452842}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6267764255553079, "3": 0.3088409066139744, "4": 0.061836189209053476, "1": 0.0023158194036741425, "5": 0.00023066848686790884}, "score": 2.4308894670951497}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.997043912057645, "4": 0.0017881650440055438, "3": 0.001155460284125245, "2": 9.698668014274153e-06, "1": 0}, "score": 4.995871806973598}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8252563199940508, "5": 0.17473701618483953, "3": 2.5972717260761345e-06, "1": 0, "2": 0}, "score": 4.174735129482146}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9507610641073373, "5": 0.04923476004309732, "3": 2.1209361214935847e-06, "1": 0, "2": 0}, "score": 4.049232740275996}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"2": 0.46235790577104763, "3": 0.3737096574635601, "4": 0.15210638524896347, "1": 0.008448277538408839, "5": 0.0033736130070475727}, "score": 2.6795978172310115}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.98500266030149, "2": 0.013967584875600951, "3": 0.0007033123884926661, "4": 0.00029749861156437037, "5": 2.8338932273821433e-05}, "score": 1.0163800711245252}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9829076975225912, "4": 0.016972289402936415, "3": 0.00010200793026562431, "1": 8.770190763432895e-06, "2": 7.773477025894808e-06}, "score": 4.982765268354247}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9979540176810697, "1": 0.0011794964132834174, "4": 0.00033834093074658144, "3": 0.0002735251456798423, "5": 0.0002544146860450521}, "score": 2.000533954761562}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6363167977421381, "4": 0.35959542461703575, "3": 0.0020455102696524856, "2": 0.002025616054998428, "1": 1.3694654277502087e-05}, "score": 4.63018083463132}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6226892691679551, "2": 0.2096812622704771, "4": 0.16558482130800253, "5": 0.002015187572150543, "1": 2.9328289376900776e-05}, "score": 2.959875272331003}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9070389463885203, "1": 0.07130719820969167, "3": 0.02157011903612218, "4": 8.025307330916769e-05, "5": 3.322652992550163e-06}, "score": 1.9504333869696775}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.6611532832653699, "1": 0.17435214553997547, "3": 0.1338273824678949, "4": 0.030443493068298518, "5": 0.0002226928700843393}, "score": 2.0210303227637323}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8816645977129293, "4": 0.11831387835014406, "3": 1.821483838819771e-05, "1": 0, "2": 0}, "score": 4.881649300338953}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8857951577813692, "3": 0.07732806680209578, "5": 0.030980422693799588, "2": 0.005617716580735148, "1": 0.0002764150548319429}, "score": 3.9415875478265896}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8524075853347921, "3": 0.06633845731196805, "1": 0.05499409847287268, "4": 0.025672818312523705, "5": 0.00058606667206745}, "score": 2.0644482582462316}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.9415784310498041, "2": 0.03656826833523862, "4": 0.021730792827293795, "1": 6.343365508896677e-05, "5": 5.902030622308276e-05}, "score": 2.985153696995201}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9282204876189946, "5": 0.07140486319366643, "4": 0.0003715542406584038, "2": 2.507302710415889e-06, "1": 0}, "score": 3.143178857463473}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9564270850557305, "5": 0.04105490343142053, "3": 0.002515581221858002, "1": 0, "2": 0}, "score": 4.038539415871558}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9958321303778302, "4": 0.003997216640284861, "5": 0.0001277306254837933, "2": 4.194056755649179e-05, "1": 8.221664240788035e-07}, "score": 3.004209093662714}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7850479659071593, "1": 0.18418391178326501, "3": 0.02895911127365236, "4": 0.001723714023742279, "5": 8.536972740907886e-05}, "score": 1.8484787477380014}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9659310153507586, "2": 0.03404460167743735, "3": 2.3834200809342684e-05, "4": 3.5545328599792215e-07, "5": 8.63225478584218e-08}, "score": 1.0340936853769647}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987366352180719, "3": 0.0007034997758718513, "4": 0.0005575660981242669, "2": 4.862723398173523e-07, "1": 0}, "score": 4.99803397196942}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5506849015074161, "4": 0.185828253521482, "3": 0.1287094166001889, "1": 0.12837768444346884, "5": 0.006399269728812588}, "score": 2.3911862338860983}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5953792390024004, "4": 0.3621918265178125, "2": 0.03675068551602452, "5": 0.005670879832501026, "1": 6.2441033722181085e-06}, "score": 3.3367707913365776}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5683081157678597, "5": 0.3593296021005209, "3": 0.05642563513909113, "2": 0.015501949325948736, "1": 0.00043373127398675}, "score": 4.270599135992573}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9066029106216591, "2": 0.06504504168921511, "4": 0.010237958955395053, "5": 0.009504061931704784, "3": 0.008606914389306252}, "score": 1.1509894650023633}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9954568091564534, "4": 0.004530877724899232, "3": 1.1344505819528253e-05, "2": 1.6095387559415687e-07, "1": 0}, "score": 4.995445946723713}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.67018329458782, "4": 0.3268992040818386, "3": 0.0028197538079177387, "2": 9.175725505379375e-05, "1": 0}, "score": 4.667184022880476}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6319234598510767, "5": 0.30002754256202463, "3": 0.04701888262389424, "2": 0.017979909200126425, "1": 0.003047530464817735}, "score": 4.2079068063561005}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9700790829437611, "2": 0.029388036770997036, "3": 0.0004733057369287142, "4": 4.3287008613293375e-05, "5": 1.6000821392675108e-05}, "score": 1.0305285213093511}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7772775384889766, "5": 0.20173151486401442, "3": 0.016944899582924847, "2": 0.004001298682225304, "1": 4.338364635353394e-05}, "score": 4.176654108063711}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5162035833167504, "4": 0.4571496408501644, "3": 0.02297687967864828, "2": 0.0036535024359098333, "1": 1.565785265074847e-05}, "score": 4.485873082745753}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5547896977600562, "5": 0.4399802673532128, "3": 0.00518019644336647, "2": 4.4578316245489986e-05, "1": 0}, "score": 4.434713200924053}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.48163388415393804, "4": 0.45844887427109304, "2": 0.04973034842230607, "5": 0.00950885318621308, "1": 0.00067703363761584}, "score": 3.4263825940270802}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6456611683498035, "5": 0.3507962529442376, "3": 0.0034588400215843653, "2": 8.291645693699137e-05, "1": 2.1316570839845437e-07}, "score": 4.347171151960316}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6313186195896602, "1": 0.19381542312571068, "3": 0.12621026412140715, "4": 0.04814482130004839, "5": 0.0005094489024135627}, "score": 2.0302128732947673}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.606944545752288, "5": 0.33778458809431994, "2": 0.0447749476596389, "4": 0.009702046852614839, "3": 0.0007916928951473579}, "score": 2.4266059345970183}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7721428401280267, "4": 0.13676368083703452, "2": 0.06548827238035755, "1": 0.023137270964930436, "3": 0.002463662044456619}, "score": 4.56929325338544}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9928353351668386, "4": 0.007154147646815126, "3": 7.548807154250673e-06, "2": 2.0623861773373333e-07, "1": 0}, "score": 4.992830116218796}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9960698062072726, "4": 0.003921182549038999, "2": 5.961842382950936e-06, "3": 2.8518718209161627e-06, "1": 0}, "score": 4.996055227400961}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8507247463724757, "4": 0.14859367671393317, "3": 0.000673047938366319, "2": 7.0913700438634e-06, "1": 0}, "score": 4.850038737714116}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.623022652813116, "4": 0.2880353394357127, "2": 0.07399942174982886, "3": 0.014647927809120111, "1": 0.0002925830499910433}, "score": 4.459499085880323}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9997098663169197, "1": 0.0002780749156004074, "3": 1.0625115209133675e-05, "4": 1.0169526504953982e-06, "5": 2.076441582376565e-07}, "score": 1.9997352069820282}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9998567795870227, "5": 7.402934420883572e-05, "4": 5.3342775843708755e-05, "2": 1.5469580666261155e-05, "1": 0}, "score": 3.00018593195401}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8850716825700626, "3": 0.1001074870253461, "4": 0.008265202889306343, "1": 0.006519073593665431, "5": 3.647100487699392e-05}, "score": 2.110228241364691}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6764202868644161, "3": 0.18802869402614156, "5": 0.06795027440881377, "2": 0.06475678475700303, "1": 0.0028433651963221977}, "score": 3.7418777617621948}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6074275683070428, "3": 0.2220529526726671, "2": 0.11288179158209131, "5": 0.04560941109927333, "1": 0.012024380283427812}, "score": 3.561718026841249}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9738966595433213, "4": 0.01935105575524828, "5": 0.003743375254783342, "3": 0.002300059009665149, "1": 0.0007082935015222979}, "score": 2.0515240314785492}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9993619879163205, "5": 0.0006074091143195665, "3": 2.7443725372988307e-05, "2": 2.578909300911713e-06, "1": 0}, "score": 4.000574807903925}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"2": 0.48573360170876717, "3": 0.40016827613581035, "4": 0.11132934485176627, "1": 0.0022358971993324565, "5": 0.0005326699267597261}, "score": 2.6221892091905024}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7766534487594329, "1": 0.1569292362128002, "3": 0.06337684532122635, "4": 0.0029987552292559056, "5": 4.140768774700377e-05}, "score": 1.9125693158073602}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.858538039814135, "4": 0.07345688819677729, "2": 0.04057564780863994, "5": 0.018533673726955982, "3": 0.008894296947989025}, "score": 1.3528701141014263}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.992818187658712, "4": 0.007178009232756685, "3": 2.7069121520534807e-06, "1": 3.5202839393973817e-07, "2": 0}, "score": 4.992815163482638}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9947951290263377, "5": 0.003857170867943748, "4": 0.0007406410225885142, "2": 0.0004627322337538676, "3": 0.00014399096549133413}, "score": 1.0184013268849863}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5731382313000912, "5": 0.4261802074407633, "3": 0.0006790043662594261, "2": 1.8205043133720542e-06, "1": 0}, "score": 4.4254978753976495}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.924638355448473, "3": 0.06545318007194048, "1": 0.00792291567595206, "4": 0.0019717555321194747, "5": 1.380941433781873e-05}, "score": 2.061515202710212}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5370472497407386, "4": 0.426326454957263, "5": 0.03657636544616515, "2": 4.8152668533468726e-05, "1": 0}, "score": 3.4994319207651263}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8295639729689288, "5": 0.12063081659607035, "3": 0.04456437526544574, "2": 0.005221771326865537, "1": 1.865235773047791e-05}, "score": 4.065566968583524}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5532117164528286, "3": 0.4161263245641644, "4": 0.026383169264421254, "1": 0.004176359270059409, "5": 0.00010229722617379103}, "score": 2.465023257452961}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9559326100451073, "3": 0.0313238340488147, "1": 0.012075930770151438, "4": 0.0006627126967048377, "5": 4.713918700465947e-06}, "score": 2.02058747451521}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5933703136084162, "3": 0.32101882908074336, "2": 0.07917256830052792, "5": 0.0033713952484130966, "1": 0.0030551692100113776}, "score": 3.514836233608827}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6951653833993932, "3": 0.16291952691390452, "5": 0.08942830823507046, "2": 0.03652302117824521, "1": 0.015950734510444847}, "score": 3.805608003329275}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9608181422047638, "4": 0.03915935235064009, "3": 1.8362445214907036e-05, "1": 0, "2": 0}, "score": 4.9608037603689334}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6310069892729311, "4": 0.3653785644517335, "3": 0.0035587354780948297, "2": 4.682037905164307e-05, "1": 0}, "score": 4.627360190531181}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5484757015860912, "5": 0.4004155884924851, "4": 0.05090606537251993, "2": 0.00019944241697794022, "1": 0}, "score": 3.851540526685619}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9875529286601759, "2": 0.01243945130448964, "3": 7.2693331274527785e-06, "4": 1.5984375980807834e-07, "5": 6.44690224890224e-08}, "score": 1.0124547289522599}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997296412535144, "4": 0.0002044158824223588, "3": 6.545949523276671e-05, "1": 0, "2": 0}, "score": 4.999664664965022}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5586564915444534, "4": 0.4163993513497922, "5": 0.024938467203036663, "2": 3.0239640135466153e-06, "1": 0}, "score": 3.4662745048511012}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.729568781245909, "4": 0.2701668359192514, "3": 0.00025892192230351677, "2": 1.3122989961488483e-06, "1": 0}, "score": 4.729310260352034}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6454116427107167, "2": 0.35164258596977294, "3": 0.002891238563447969, "4": 4.6559662652655335e-05, "5": 7.744683112802106e-06}, "score": 1.3575958024956416}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9784822943455581, "1": 0.013897665536007442, "3": 0.00697270107908008, "4": 0.0006344487793963651, "5": 1.2649586893048412e-05}, "score": 1.9943818805104143}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9990155496894662, "4": 0.0009828146608487434, "3": 7.611678030813312e-07, "1": 0, "2": 0}, "score": 4.999015662142759}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6674405342113927, "2": 0.3202158113602979, "3": 0.011357324645309816, "4": 0.0008722736190157743, "5": 0.00011323333010231598}, "score": 1.346000499529308}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9809804551595576, "2": 0.008729156802433618, "4": 0.0045270380746218, "3": 0.0038242955446446234, "5": 0.0019368429051281587}, "score": 1.0377063171241345}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7477242415569203, "3": 0.1806747546097471, "5": 0.03761068851376306, "2": 0.033948170992253175, "1": 4.11368189206336e-05}, "score": 3.7889159687938143}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4722212090232591, "3": 0.3709562083997249, "4": 0.13976868120433522, "5": 0.0106370541394108, "1": 0.006416172646732211}, "score": 2.675989016592985}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9928207660108933, "4": 0.007157235327643959, "3": 2.1113751498059795e-05, "2": 2.5470495522676814e-07, "1": 0}, "score": 4.992799768516871}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5686719038825329, "5": 0.2368760193097707, "3": 0.18926545983269405, "2": 0.005185847491657837, "1": 0}, "score": 4.03723889314847}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5925285271756429, "3": 0.3885007650250212, "5": 0.018859109862517553, "2": 0.00010855072312342776, "1": 0}, "score": 3.6301401163491467}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.674108474247107, "3": 0.3102098112351097, "4": 0.014211292271723826, "1": 0.0012043788766432425, "5": 0.00026605220740522756}, "score": 2.3382261705348903}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7805285504524713, "3": 0.20534783122376726, "5": 0.013234922486843152, "2": 0.0008878234076565971, "1": 0}, "score": 3.806111275293566}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9857002132175232, "4": 0.01006527397192542, "2": 0.0032904070449120766, "5": 0.0009432605636289544, "1": 4.3484986646221084e-07}, "score": 3.008660521908402}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5128831692507839, "5": 0.46963921815343074, "3": 0.016672253639920562, "2": 0.0006930343450816821, "1": 0.00011108309867821135}, "score": 4.451248206757423}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8174415477420744, "5": 0.17618427757908797, "3": 0.006300869747214297, "2": 7.246991845992415e-05, "1": 0}, "score": 4.1697386097289275}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3488483773617994, "5": 0.2950428732946384, "1": 0.2529915221764637, "2": 0.06364220042365892, "3": 0.039469340434473255}, "score": 3.3693109791908222}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9805651253507294, "3": 0.017825659763262405, "4": 0.001602312469067707, "2": 1.3982627286698564e-06, "1": 0}, "score": 4.962741968142268}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.620673686330443, "4": 0.3312546049640731, "3": 0.04674190468779805, "2": 0.0013288292334766652, "1": 0}, "score": 4.571274680045228}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.908563561924467, "4": 0.09139702045627984, "3": 3.712481292170869e-05, "2": 5.154461503265769e-07, "1": 0}, "score": 4.908527020998996}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9829296972088747, "5": 0.016839847938314938, "4": 0.00017784876564877413, "3": 2.655626150107062e-05, "2": 2.579788619034451e-05}, "score": 1.0679718655841943}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"2": 0.812811055909149, "3": 0.1218670844348774, "1": 0.0418942078114528, "4": 0.021783357895798525, "5": 0.0016440361393775698}, "score": 2.1284717339543673}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6914140435099972, "4": 0.2987196412938712, "3": 0.009498421994641059, "2": 0.00035887263843910333, "1": 8.83119692888247e-06}, "score": 4.681171511638499}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9940632972768889, "4": 0.005889365571137334, "3": 4.645181589161443e-05, "2": 3.5103075367887024e-07, "1": 0}, "score": 4.994016674507897}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7383967184052085, "4": 0.2581113236780743, "3": 0.001752289080138326, "2": 0.0017270716371307242, "1": 1.1358763470768224e-05}, "score": 4.733157117728548}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4262976362629907, "5": 0.3218550789886927, "2": 0.22761472089978385, "3": 0.02422478491215343, "1": 6.656604754660273e-06}, "score": 3.8423807055615886}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4904601043411597, "5": 0.4006929723205815, "3": 0.1062530888575193, "2": 0.0025244047162252823, "1": 6.93824225436979e-05}, "score": 4.289182940453471}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8854561261197607, "4": 0.11194383574790488, "3": 0.002435454224520084, "2": 0.00014612765046442678, "1": 1.8052398520342187e-05}, "score": 4.882674615874688}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6512389847950137, "5": 0.19148381325835442, "3": 0.1486929109732175, "2": 0.008548469653059327, "1": 3.5059953667230354e-05}, "score": 4.0255888026004785}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.752068273443344, "4": 0.24773347705602147, "3": 0.00017642688794767826, "2": 1.7986015836175457e-05, "1": 2.0453247072961033e-06}, "score": 4.751851085319506}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.583294870028869, "5": 0.37320119797726226, "3": 0.04060890911975249, "2": 0.002875923899525564, "1": 1.8882197707922943e-05}, "score": 4.326783865304522}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"1": 0.44401359395626, "5": 0.29128785741746216, "4": 0.2205918318103255, "2": 0.027171463294530147, "3": 0.016930204563667846}, "score": 2.88796832979503}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9959339259557018, "4": 0.003976232563788014, "1": 7.975126135984577e-05, "3": 7.329223369487491e-06, "2": 1.978916668723967e-06}, "score": 4.995684163818702}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7112227194921557, "1": 0.26390109135354406, "4": 0.01677133667504341, "2": 0.007701004531462444, "3": 0.0003995950095026369}, "score": 3.9037174318752754}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7661334252579748, "4": 0.23306152604389194, "3": 0.0006660119131308547, "2": 7.251428362437724e-05, "1": 5.376617532229402e-05}, "score": 4.765170847020442}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955497846845534, "4": 0.004447624257877778, "3": 1.0126154700241458e-06, "1": 0, "2": 0}, "score": 4.995550343487657}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9992246194230001, "3": 0.0004119586408253633, "4": 0.00035868058532334925, "5": 3.7680120623299004e-06, "1": 7.382362069038496e-07}, "score": 2.001139885879442}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5401737672412482, "4": 0.18087724178415704, "1": 0.11430851660240515, "5": 0.10916093693980157, "3": 0.05547846785970613}, "score": 2.6304079199121095}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6331616868447048, "5": 0.3459039650879209, "3": 0.013766138968553554, "2": 0.0068703309547493655, "1": 0.0002974920666669102}, "score": 4.3175048105913}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9999083813732428, "4": 4.339006760835537e-05, "5": 2.366543531235615e-05, "2": 1.9858409264746643e-05, "3": 3.438947818778033e-06}, "score": 1.000251568567404}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9996082495542522, "1": 0.0003887068878662664, "3": 1.4112030364736754e-06, "5": 1.271110029839431e-06, "4": 2.432558662586171e-07}, "score": 1.9996170041118033}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9345121645465259, "2": 0.06514367915468874, "3": 0.000337143129891516, "4": 6.567239376473663e-06, "5": 3.839770698783848e-07}, "score": 1.0658392071197809}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5061331004080853, "2": 0.49192712174313086, "3": 0.001922646608873529, "4": 1.3676192644053215e-05, "5": 3.4099668095023004e-06}, "score": 1.4958271057581605}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8304885723394809, "3": 0.12704219545861023, "1": 0.04174443207717176, "4": 0.0006791816095282597, "5": 4.562425842008819e-05}, "score": 2.086792998877284}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8695907241785713, "5": 0.09732821036533519, "3": 0.03293888513929002, "2": 0.00014156649810519983, "1": 0}, "score": 4.064106231579438}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8194132365874696, "1": 0.17923379644322235, "4": 0.0006798971644366348, "3": 0.0006641118326524458, "5": 8.77239235760303e-06}, "score": 1.822816394013667}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5871916628067585, "5": 0.40880148807258054, "2": 0.0027310932283469798, "3": 0.0012685655564102115, "1": 0}, "score": 4.402073627103913}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8584377941801812, "3": 0.10758554289429248, "5": 0.029088664987992965, "2": 0.004791974689532638, "1": 9.239561843274636e-05}, "score": 3.9116416653280295}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7568071148952582, "5": 0.18639410551579438, "4": 0.03631066424509014, "3": 0.020478600829842833, "1": 5.179572676396111e-06}, "score": 2.652279893889806}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9847180051366454, "4": 0.015255435701431974, "3": 2.454427324445929e-05, "2": 1.5986661910013156e-07, "1": 0}, "score": 4.984694967761049}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.56971938864277, "3": 0.19255123592873727, "5": 0.12846632130633442, "1": 0.06020199425840657, "2": 0.04905584185807123}, "score": 3.6571956301310857}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6802126085822889, "1": 0.3185235711365873, "3": 0.001249226523989729, "4": 1.4300844020894411e-05, "5": 3.0263693022354104e-07}, "score": 1.6827551680710655}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6517072832077632, "5": 0.33157700623433495, "3": 0.016564104573811696, "2": 0.00014942155777387153, "1": 1.5480848060922885e-06}, "score": 4.314709614553348}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5634076192138792, "3": 0.4160666854522036, "2": 0.01550601446997909, "5": 0.004946887440886339, "1": 7.219657145253659e-05}, "score": 3.55765131931785}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7016343707694628, "4": 0.2961108800611531, "3": 0.0022159514925060874, "2": 3.760317761883735e-05, "1": 0}, "score": 4.699344048287666}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996566101717876, "4": 0.0003428511054303748, "3": 1.5910459831143386e-07, "1": 0, "2": 0}, "score": 4.999656830555099}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9453118083367218, "5": 0.038578775934064675, "3": 0.01363378194011423, "2": 0.0024750895544498348, "1": 0}, "score": 4.019994825766928}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8715296611549679, "3": 0.11723325457252577, "1": 0.007285242152579719, "4": 0.0039381374337354915, "5": 1.3757285770049931e-05}, "score": 2.1178655529450485}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.945206681329916, "4": 0.053171246929062464, "3": 0.0012008900365314636, "2": 0.00023180524501152829, "1": 0.0001890889535355617}, "score": 4.942975185053723}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9327144506655837, "3": 0.06277611576890438, "4": 0.002347596359532772, "1": 0.0021409706029328207, "5": 2.0700535261164353e-05}, "score": 2.0653924503504}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9989810481843177, "2": 0.0009292493019355004, "4": 5.142312931724426e-05, "5": 3.3352660955999684e-05, "1": 4.826644752080186e-06}, "score": 2.9991792257776466}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4233447754249503, "4": 0.348768360722292, "2": 0.22181075846272255, "5": 0.005717292070126019, "1": 0.0003588196727466339}, "score": 3.1376745461797038}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9926497114754491, "4": 0.0067064957991981216, "3": 0.00035930210688561433, "5": 0.00027563473297656526, "1": 8.668576218298757e-06}, "score": 2.0145905320609354}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5441079577874421, "4": 0.43927264476231864, "3": 0.01422576815608422, "2": 0.002393037020130121, "1": 0}, "score": 4.525096426592071}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9998571371458695, "5": 8.08696466681405e-05, "3": 6.139224707012574e-05, "2": 2.111782021410924e-07, "1": 0}, "score": 4.000019055050622}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9232773011364668, "4": 0.07669124677521427, "3": 2.9713680360766387e-05, "2": 3.2237302473218963e-07, "1": 0}, "score": 4.923248250061831}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"4": 0.36365371375152733, "3": 0.35119294699889897, "2": 0.1226816856024029, "5": 0.10904877715663341, "1": 0.05342256803058701}, "score": 3.352224555048386}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6629186010591622, "1": 0.33374868812066577, "3": 0.0032589324713735855, "4": 6.488974234381293e-05, "5": 8.841261392808588e-06}, "score": 1.6696665319799155}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7485856146751579, "1": 0.12949055951472957, "3": 0.09933652011150516, "4": 0.021253731479332585, "5": 0.0013333282753834016}, "score": 2.0163534124036127}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7174445618842907, "5": 0.24798666609712083, "2": 0.02452171076893208, "3": 0.010046660381995365, "1": 0}, "score": 4.188896659899824}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992354549136463, "4": 0.0006356995575668826, "3": 0.00012802423193112388, "2": 1.9144409558602348e-07, "1": 0}, "score": 4.999107677084251}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5116125902612612, "2": 0.33849342863797616, "4": 0.1496079609427, "3": 0.0002819970353569607, "1": 2.091130979151734e-06}, "score": 3.834337142497745}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9427244790128133, "2": 0.05583569046459061, "3": 0.0011895877029522426, "4": 0.00020549168235608443, "5": 4.3853325672662166e-05}, "score": 1.0590068071972512}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9999717939237989, "3": 9.368842517757812e-06, "5": 8.581914793134372e-06, "2": 6.725582628640514e-06, "1": 0}, "score": 3.9999857618567614}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9992045081215623, "5": 0.0007342059374271187, "2": 4.786322948562082e-05, "4": 8.487466602427615e-06, "3": 3.948732170763171e-06}, "score": 1.0030180498206878}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9994779626589337, "4": 0.00038198175969013777, "3": 0.00011096474718757236, "5": 1.4237901918779371e-05, "1": 1.4193265023355374e-05}, "score": 2.0009034493032765}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6628652979175326, "4": 0.19630771036387706, "2": 0.1353175960709751, "5": 0.004333537915646889, "1": 0.0011757033673161154}, "score": 3.0673057937791994}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.4731167226513765, "2": 0.42584506331779537, "3": 0.07718367562083335, "4": 0.023315420809747522, "5": 0.0005364605128501003}, "score": 1.6523062522748269}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3848654832124973, "2": 0.3266173750745486, "4": 0.2860404627564418, "5": 0.002407224872879822, "1": 6.861200764452276e-05}, "score": 2.964100283182075}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981124077472681, "4": 0.0018868056727749307, "3": 2.7186791369860616e-07, "1": 0, "2": 0}, "score": 4.998112649619956}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8518766070904011, "3": 0.0948275974257587, "4": 0.044608118828914925, "1": 0.007801209446992513, "5": 0.0008859807805287066}, "score": 2.1789006550003633}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"4": 0.658535828510177, "5": 0.34034441118854775, "3": 0.0011146892638952274, "2": 2.7501255301509025e-06, "1": 0}, "score": 4.3392250089849345}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5884336517082221, "5": 0.4108023008675566, "3": 0.0007479759746182182, "2": 1.5517983201657965e-05, "1": 0}, "score": 4.410023515860774}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7969606133862093, "5": 0.1859257831907759, "3": 0.01681634414039765, "2": 0.00028941642211206006, "1": 0}, "score": 4.168531927978555}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.991216011644256, "4": 0.008781475790337832, "3": 6.354785498964035e-07, "1": 0, "2": 0}, "score": 4.991217236766552}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5767104835559428, "4": 0.4231828600860807, "3": 0.00010477849578746175, "2": 1.4254443047983497e-06, "1": 0}, "score": 4.576603115037107}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6091032228417164, "3": 0.2983585582966875, "5": 0.05079198563165571, "2": 0.04174139319313327, "1": 3.2249600351334615e-06}, "score": 3.6689404313819773}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9909143829359194, "4": 0.009063644292624162, "3": 2.1092585022069444e-05, "1": 0, "2": 0}, "score": 4.990894162522498}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9982377185447133, "5": 0.0017531056618286965, "2": 4.860535212920389e-06, "4": 4.101626317906167e-06, "1": 0}, "score": 3.003505453163639}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9843265167563944, "4": 0.01567102207169537, "3": 1.6805305682054065e-06, "1": 0, "2": 0}, "score": 4.9843256046310875}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9950068245528307, "5": 0.004092016903648075, "3": 0.000556043516327665, "4": 0.00034486162787832666, "1": 0}, "score": 2.013521820909449}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5984622382258107, "2": 0.25833285239381343, "4": 0.13857580147525667, "5": 0.0039024204115667986, "1": 0.000726570528377249}, "score": 2.8865946355833443}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8555172347770823, "4": 0.1433751725565907, "3": 0.001090493863035053, "2": 1.6328671624566173e-05, "1": 4.72817196452741e-07}, "score": 4.854392919142588}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9729454481399359, "4": 0.02604703075012538, "3": 0.0009977717651912436, "2": 9.32848906452637e-06, "1": 1.0531110108013792e-07}, "score": 4.971929010150245}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6598401567737775, "5": 0.220848948964012, "3": 0.11617583692900356, "2": 0.003122865403727899, "1": 1.1787793630337542e-05}, "score": 4.098392057610419}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7998222607988076, "4": 0.19820678987079457, "3": 0.00194978532930979, "2": 1.9789778320584137e-05, "1": 0}, "score": 4.7978339923144935}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3447532621463669, "4": 0.3340692407018822, "2": 0.23408960724069983, "5": 0.08229647527339726, "1": 0.00479075001732177}, "score": 3.254991253445705}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9974599110991688, "4": 0.002527479797949271, "3": 5.397870683651956e-06, "1": 1.1022533207627965e-06, "2": 0}, "score": 4.9974572999141}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9931403704078462, "1": 0.0036156497583742773, "4": 0.0030611436224860233, "2": 0.0001041872288475145, "3": 7.546594975963186e-05}, "score": 4.982012706503812}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8943941386415228, "4": 0.105161249215727, "3": 0.00041682241090695296, "2": 2.2578193655156936e-05, "1": 0}, "score": 4.893936818629174}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9692308084885943, "4": 0.030748763405300677, "3": 1.2801566649962262e-05, "1": 0, "2": 0}, "score": 4.969225398757689}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6692907361995102, "1": 0.3274504280815833, "3": 0.003105809155381379, "4": 0.00014644772780055535, "5": 6.62893102365843e-06}, "score": 1.6759681795549408}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.722854298966316, "4": 0.27554980123287626, "3": 0.0015826494012963802, "2": 1.1116367346339572e-05, "1": 0}, "score": 4.7212509560030655}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9889859269855985, "4": 0.00800643248308543, "5": 0.00243269885017404, "3": 0.0005741045703081229, "1": 7.676806581285708e-07}, "score": 2.0238843000646343}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8589130538417302, "5": 0.13977712348763435, "3": 0.0007511047764646181, "2": 0.0005563932664406435, "1": 0}, "score": 4.137913552775958}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8493255118231727, "3": 0.1261557656781191, "5": 0.023354191581322247, "2": 0.0011641434481775995, "1": 1.9305899908803307e-07}, "score": 3.894869539391416}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6065182259615557, "3": 0.2243631801779097, "2": 0.08556961703678645, "5": 0.08209944685506367, "1": 0.0014484721032520644}, "score": 3.6822512801584386}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6284385677257504, "3": 0.19995586735676202, "4": 0.1322810173520033, "1": 0.029426171898554086, "5": 0.009898130282811697}, "score": 2.46478623506181}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983492730509439, "4": 0.0016218107614147045, "1": 1.828917871625962e-05, "3": 6.36166132563745e-06, "2": 2.997364965800779e-06}, "score": 4.998283314929445}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6812135425224964, "1": 0.3147573671428725, "4": 0.0035245940939525825, "2": 0.00030293024302483065, "3": 0.0001992653907229538}, "score": 3.736135708169088}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9654282072334698, "1": 0.02386731808480613, "5": 0.008885591026538067, "4": 0.001230969018310838, "3": 0.0005875423085415932}, "score": 2.005838937513973}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9946270556775961, "2": 0.005371656204726705, "3": 1.245956562205548e-06, "4": 0, "5": 0}, "score": 1.0053741483444312}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6394453813350707, "3": 0.1710317101837902, "5": 0.16276935178258065, "2": 0.02664104253177576, "1": 0.00010473041349362599}, "score": 3.938140883798659}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8682342564762795, "1": 0.06975935119186452, "4": 0.06089987845993809, "3": 0.0007788449259580522, "2": 0.0003187434534176885}, "score": 4.657545739987491}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5327476921338158, "4": 0.2235766210922842, "2": 0.12381316295869935, "5": 0.08410390334005224, "3": 0.035683360189139486}, "score": 2.2024158541351238}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9570265356133097, "2": 0.042010256001353566, "4": 0.0006923617353374857, "5": 0.00017562228097306692, "3": 9.484477026535238e-05}, "score": 1.0449795369459656}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6540023724056127, "2": 0.3417757358984461, "3": 0.003870200362596064, "4": 0.0003052708935431697, "5": 4.537750773587875e-05}, "score": 1.3506138250016122}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8195196279142193, "1": 0.17409020405301245, "3": 0.006356213757829887, "4": 3.312795732192106e-05, "5": 8.757238810308681e-07}, "score": 1.8323349010748105}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9730872059153535, "3": 0.019750837173534146, "1": 0.005941688064725777, "4": 0.0011737740943321107, "5": 4.563265405601226e-05}, "score": 2.016293609306329}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9615387405320417, "3": 0.026123254090554705, "1": 0.01212029813555935, "4": 0.00021604798979077912, "5": 1.4678570645283095e-06}, "score": 2.01443945826941}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9131812798900354, "1": 0.07579637581074646, "3": 0.010779781313762057, "4": 0.00023594566794866252, "5": 6.09193982919499e-06}, "score": 1.935473538757638}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5811916815101588, "1": 0.21511209814680124, "3": 0.14661175625639533, "4": 0.054209381234864545, "5": 0.002874757373845261}, "score": 2.0485427085004395}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.962612900960547, "4": 0.017921807707293003, "5": 0.015003421558374964, "2": 0.0031850550689923327, "3": 0.0012756590907684864}, "score": 1.1195156207198356}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6543415082153129, "2": 0.21572418684507835, "4": 0.12751187263666422, "5": 0.0023975267351670814, "1": 1.5957621593680248e-05}, "score": 2.9165500773133153}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.908480704705966, "2": 0.06025982194883476, "5": 0.01893228714265031, "4": 0.008216548899354685, "3": 0.004109791424740707}, "score": 1.1688583429006156}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9924858732731728, "4": 0.00751152778855868, "3": 1.2120989884665412e-06, "1": 0, "2": 0}, "score": 4.992486037592805}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5177716572657056, "2": 0.4781486077184428, "3": 0.0039842798430388526, "4": 8.695820126416217e-05, "5": 8.224697829848803e-06}, "score": 1.4864110732365843}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7467215134391669, "2": 0.25042397438258335, "3": 0.0025405949324605603, "4": 0.0002127905945535754, "5": 0.00010112279373803817}, "score": 1.2565480281957506}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8895311347138054, "4": 0.10653134690555223, "3": 0.0025994372491926396, "2": 0.0012063399960135365, "1": 0.00013041798450479184}, "score": 4.884128933355093}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6937441128080153, "5": 0.15381253858092686, "3": 0.11529104749940904, "2": 0.03707129605730485, "1": 7.975764171596544e-05}, "score": 3.9641395813090208}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9656864957545689, "3": 0.02638015384050908, "4": 0.007686951484537699, "5": 0.00022344930341466237, "1": 2.2110631539047966e-05}, "score": 2.0424023296632257}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9943127335806174, "4": 0.005672748695284072, "3": 1.4210534531356684e-05, "1": 0, "2": 0}, "score": 4.994298828484312}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5442947821159118, "2": 0.28074918171701885, "4": 0.17233820925375046, "5": 0.001352585950377945, "1": 0.0012650263841305002}, "score": 2.891764123444101}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7489401688730459, "4": 0.24991507970615223, "3": 0.0011140781358895228, "2": 3.035819683461228e-05, "1": 0}, "score": 4.7477656099555166}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9442201068302929, "4": 0.05560593715851589, "3": 0.00015792694583426163, "2": 9.725006500773374e-06, "1": 0}, "score": 4.944048681209907}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9776356748046653, "4": 0.02234450163601138, "3": 1.7568395155093558e-05, "2": 2.0805838635731614e-06, "1": 0}, "score": 4.977614115913953}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7431513899795722, "1": 0.2477082838425015, "3": 0.008996496996714209, "4": 0.00013601410015392284, "5": 7.7462709355865e-06}, "score": 1.7615834637618564}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6812343539141129, "4": 0.3114079468993096, "3": 0.0031293592745548146, "1": 0.002933919607334207, "2": 0.0012937572462501253}, "score": 4.666716163396833}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9687693154348076, "2": 0.01543202474336007, "4": 0.00838954240931931, "5": 0.007396490115560573, "1": 1.2326390807254293e-05}, "score": 3.0077258474402213}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.566726587811269, "5": 0.29346485246073656, "1": 0.05790448709980486, "3": 0.04259173749649275, "2": 0.03930993472770054}, "score": 3.998539780704313}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9992010539275084, "5": 0.00044676148337595954, "2": 0.00032833405746026225, "3": 1.7124985851604603e-05, "4": 6.443897493848976e-06}, "score": 1.0021689622660337}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8751596081016851, "5": 0.056160377355166664, "4": 0.05362602970286941, "3": 0.00867887818518841, "2": 0.006363558789671041}, "score": 1.4092456396028923}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5953738806133622, "4": 0.1971801107827041, "3": 0.18285220050085746, "1": 0.02001274416718382, "5": 0.004580645737837947}, "score": 2.5709418538793685}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9777333357098142, "4": 0.021895371752422465, "1": 0.00026031399045032703, "3": 9.587512447237418e-05, "2": 9.385458824399043e-06}, "score": 4.97684333325137}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9986159611664029, "5": 0.0011324331851585603, "2": 0.00017206917186336047, "4": 6.106235516976951e-05, "3": 1.7821267687211635e-05}, "score": 1.004920634725836}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6769117967555951, "3": 0.1995002479092717, "5": 0.09766637939359635, "2": 0.024695105818043628, "1": 0.001225364412048932}, "score": 3.8450996553370063}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9561342757388033, "2": 0.04385128746208894, "3": 1.40255625057211e-05, "5": 2.1122540574407683e-07, "4": 1.1466935772322573e-07}, "score": 1.0438805312416417}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6877752953444616, "2": 0.31201319512488496, "3": 0.0002093248932178561, "4": 1.676061268815608e-06, "5": 3.846588497603036e-07}, "score": 1.3124384504470605}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5341668690386427, "1": 0.3761790094213613, "3": 0.044175055694831565, "5": 0.022892814384458005, "4": 0.022582947339824425}, "score": 1.7818396632783688}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9997363148710362, "1": 0.00021707839551751923, "3": 4.193431887746401e-05, "4": 2.549018945692092e-06, "5": 1.98578054391582e-06}, "score": 1.9998359112803021}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.997741436800771, "2": 0.002231114594982291, "3": 2.4781850683199296e-05, "4": 1.7285079123733183e-06, "5": 9.242317361960516e-07}, "score": 1.0022895607791162}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"5": 0.975640128853624, "4": 0.023934261763540094, "3": 0.0002297497235485341, "1": 0.0001732518918820103, "2": 1.3344169634648389e-05}, "score": 4.9748729659461945}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7892278078206368, "4": 0.20991581701336545, "3": 0.000824379397634145, "2": 1.7718983127769646e-05, "1": 1.0186278382109958e-05}, "score": 4.7883406563344595}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.919850645468487, "4": 0.07979778753787557, "3": 0.00034764364898591364, "2": 2.539312964345613e-06, "1": 0}, "score": 4.919499195809596}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7620995947992084, "5": 0.15515215475177674, "3": 0.08190147324053335, "2": 0.0008322971745229307, "1": 7.744946436504415e-06}, "score": 4.071563334308209}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.979754504805229, "4": 0.019845053437638312, "1": 0.0002627890339405846, "3": 0.0001271482283164681, "2": 9.23731776153358e-06}, "score": 4.978821755180094}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9581150042751645, "3": 0.03696115436045837, "1": 0.0038785209363288464, "4": 0.0010413622158144853, "5": 3.841371859833872e-06}, "score": 2.035176886081419}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9772229347608384, "3": 0.016885111865937233, "1": 0.00581749047552598, "4": 7.449034785243302e-05, "5": 3.6975067603286296e-08}, "score": 2.01121671228868}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8522358425100178, "4": 0.14498672390923814, "3": 0.001915612239757296, "2": 0.0005585157719583226, "1": 0.00030085744802441956}, "score": 4.848302703129936}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5297948091214099, "5": 0.4647664303092998, "3": 0.00541094405228909, "2": 2.6584186804084413e-05, "1": 5.018201742780004e-07}, "score": 4.459301147946971}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6188852519352908, "4": 0.37733688363677487, "3": 0.00338709620959762, "2": 0.00022546514017410862, "1": 0.0001608984720953736}, "score": 4.614567236955639}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6828051811482896, "1": 0.31591613379587985, "3": 0.0012733322446742436, "4": 5.047790172758632e-06, "5": 6.713247036203802e-08}, "score": 1.6853674205790743}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9003372568663697, "3": 0.06274858192690638, "5": 0.03651278886132561, "2": 0.0003982404855922456, "1": 2.7700643693570216e-06}, "score": 3.972959405986964}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9586327868438714, "4": 0.04111458311900821, "3": 0.0002478886263419636, "2": 3.0946213555704746e-06, "1": 5.789197326414948e-07}, "score": 4.9583779956384335}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8474960080534847, "4": 0.15103372843359963, "3": 0.001303740289248929, "1": 9.001385095277861e-05, "2": 7.428481509557633e-05}, "score": 4.8457755380576035}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.663331721389992, "4": 0.33580642537240674, "3": 0.0008575234777488802, "2": 3.080994880459812e-06, "1": 0}, "score": 4.6624688631903926}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7597479617342161, "5": 0.2327287422433361, "3": 0.007517973941455418, "2": 4.973269932971786e-06, "1": 1.1911088154275668e-07}, "score": 4.225200516157969}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6997781309258914, "2": 0.19237788311169696, "3": 0.09311698249519916, "5": 0.014705878017296323, "1": 2.0955278212732442e-05}, "score": 3.5367701846354582}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9939723620408506, "4": 0.006010325332719599, "3": 1.5147000990907457e-05, "1": 0, "2": 0}, "score": 4.993959367583551}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8196429421141298, "3": 0.17730213929732638, "5": 0.0027572650898584814, "2": 0.0002966139785714373, "1": 0}, "score": 3.82486171577562}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9726419851424906, "5": 0.02722718925470873, "3": 0.00012962537480015702, "2": 2.590232528326892e-07, "1": 0}, "score": 4.027097071337295}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9899713506595121, "3": 0.00796741962165834, "1": 0.0017342526632877983, "4": 0.00032567259209191884, "5": 1.242944992793744e-06}, "score": 2.006888241401287}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8476164034123066, "1": 0.149423817196998, "3": 0.0028444305204474904, "4": 0.00010827968525412123, "5": 6.859843019109823e-06}, "score": 1.8536577215874335}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9897467358058217, "1": 0.009409767814735985, "3": 0.00084167466668148, "4": 1.6993019650824502e-06, "5": 2.8962961874112865e-08}, "score": 1.991435391544417}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9968345562149606, "4": 0.001274052390291364, "5": 0.0009812885529587338, "2": 0.0005023195937028618, "3": 0.0004061891988054763}, "score": 1.0090620238193353}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9957110895590838, "4": 0.0022880132829415298, "5": 0.0018024880833607108, "2": 0.00019821643861042156, "1": 9.782017429927447e-08}, "score": 3.0056945779106403}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7363518628279246, "3": 0.18839615985176963, "5": 0.05282408695312269, "2": 0.02242120087736074, "1": 6.23539892078034e-06}, "score": 3.8195667372167663}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6757485767541346, "5": 0.3236481856201492, "3": 0.000557575855616362, "2": 4.516383057416564e-05, "1": 0}, "score": 4.3230004429380715}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998070873500388, "4": 0.00019156488148795473, "3": 7.978649415486417e-07, "1": 0, "2": 0}, "score": 4.999806839282409}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6974415068152063, "4": 0.2999435466100893, "2": 0.0017943696296032637, "3": 0.0008145711333275997, "1": 0}, "score": 4.69304235870463}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6386976996715433, "5": 0.3563047767217737, "1": 0.003118244798633793, "3": 0.0014953170814694186, "2": 0.00038082561158316643}, "score": 4.344694155021746}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9257181132648447, "1": 0.04159259218698259, "3": 0.030527920130194498, "4": 0.0021080778884616834, "5": 5.306972197360391e-05}, "score": 1.9933106913688703}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9145642249849301, "2": 0.08539415697711954, "3": 4.0870419344212444e-05, "4": 6.397284803916333e-07, "5": 1.0757086470518906e-07}, "score": 1.085478247311998}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9960285292325338, "3": 0.0037151322593723755, "4": 0.00017460644540092534, "1": 5.769673337524943e-05, "5": 2.3850938292480073e-05}, "score": 2.0040782019836603}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9997577514469204, "3": 9.883873256737387e-05, "1": 7.892220006849937e-05, "4": 5.475022936288508e-05, "5": 9.669151480216014e-06}, "score": 2.0001584244564756}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9646445137936389, "4": 0.034340309868827856, "5": 0.0009973128957273235, "2": 1.708065536540675e-05, "1": 0}, "score": 3.0363178834340636}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9953742478994413, "3": 0.0039948230244768335, "1": 0.0004948125767120848, "4": 0.0001348619358830506, "5": 1.311998514085241e-06}, "score": 2.0037736700983317}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9984016722884271, "1": 0.0012186312211145867, "3": 0.00037174515710452084, "4": 7.77594160872775e-06, "5": 5.992734051401679e-08}, "score": 1.9991688455052605}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7384043165465333, "5": 0.18199632216393336, "3": 0.05044706551895509, "2": 0.029070714096208657, "1": 8.122479502158855e-05}, "score": 4.073164180178281}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9991298919237583, "2": 0.0008611559012077701, "3": 7.326548691116122e-06, "4": 7.790754038970945e-07, "5": 6.931676138321199e-07}, "score": 1.0008809190303753}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4038991099720984, "5": 0.23376510326553024, "2": 0.1443496063397822, "1": 0.14031304736652328, "3": 0.0776666755272336}, "score": 3.4464564984360404}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8922271735139293, "3": 0.09858886054232618, "1": 0.008342867473016524, "4": 0.0008363829295929536, "5": 4.621399392156566e-06}, "score": 2.0919326317813707}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.854254662497893, "5": 0.09686006218482322, "1": 0.03775828715858416, "3": 0.00904667040514385, "2": 0.002078590207343436}, "score": 3.970381298721564}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8750445059282919, "5": 0.06263004274153339, "3": 0.06009462955016474, "2": 0.002228503488892555, "1": 2.0701758553914934e-06}, "score": 3.9980721952076994}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9999781115595554, "4": 1.788425215889065e-05, "3": 2.193083529733805e-06, "5": 1.5138000182736015e-06, "1": 0}, "score": 2.000042503000539}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8844791042724696, "3": 0.08398676937373173, "4": 0.018436637972665943, "1": 0.012928423750630162, "5": 0.00016850738183864938}, "score": 2.108437204140437}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.88865283637639, "4": 0.09597156781256522, "3": 0.015195772725107698, "5": 0.00012655988026732699, "1": 5.320889374133256e-05}, "score": 2.207465390365144}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4129391225139225, "4": 0.342331367565702, "2": 0.2328640435030653, "1": 0.01095749589829415, "5": 0.0009078312905369223}, "score": 3.0893680072896936}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7063839858762253, "5": 0.2855721120980414, "3": 0.007668274931857374, "2": 0.0003717700648644473, "1": 2.6601235204217978e-06}, "score": 4.27715264839142}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.8111624797407361, "3": 0.14910223013690463, "4": 0.03300092129087669, "1": 0.006620006017802652, "5": 0.00011415881100646806}, "score": 2.2088265857350566}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9715580703934292, "4": 0.02241576887850139, "3": 0.0054308061163775775, "5": 0.0005034113141745679, "1": 9.175587870529064e-05}, "score": 2.051680831623159}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9255758265155012, "3": 0.06290626611293927, "1": 0.010834429487193573, "4": 0.0006807414405826945, "5": 2.67119398531105e-06}, "score": 2.053441336575904}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9656743793621191, "1": 0.019276822721170112, "3": 0.014839822533105814, "4": 0.00020771118018587018, "5": 7.330136596260769e-07}, "score": 1.9959806190782323}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.872547417218527, "3": 0.11101408431482175, "4": 0.015792217872530562, "5": 0.0006450240210009657, "1": 7.007084095505083e-07}, "score": 2.144532971755255}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9998659569845679, "4": 7.442355996925329e-05, "3": 5.480618529680677e-05, "5": 3.996022765988008e-06, "1": 6.432463886660538e-07}, "score": 2.000214998164554}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6005022443501844, "3": 0.3446907985146419, "4": 0.054505672508739764, "5": 0.0001776992577137623, "1": 0.00011740770762995298}, "score": 2.454120639001035}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6088110634787465, "4": 0.23336453969487067, "5": 0.10186682052190572, "2": 0.055926038626706844, "1": 3.067185803991426e-05}, "score": 3.3811111283694295}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.993413590509172, "4": 0.006574327417940732, "3": 6.505315148862527e-06, "2": 4.285857111054551e-06, "1": 0}, "score": 4.9933997958602205}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9999582051834277, "4": 3.7414209221078306e-05, "3": 2.4874140854916403e-07, "1": 0, "2": 0}, "score": 4.999962088151316}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8774360445517251, "4": 0.12010544664603501, "3": 0.002376065525000113, "2": 7.460716573042155e-05, "1": 0}, "score": 4.8749176206473015}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9708336214536917, "4": 0.028988354459752258, "3": 0.00012686741413813182, "2": 3.0586127545058684e-05, "1": 1.6055067919581666e-05}, "score": 4.970601799310761}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7612979754547402, "2": 0.22985008199438214, "4": 0.008333131192302081, "1": 0.000491413954914998, "5": 2.7299204374206717e-05}, "score": 2.7775547978528787}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.619741991683664, "3": 0.35685990399712686, "2": 0.020745726610442876, "5": 0.0026186996531659366, "1": 3.329028317850607e-05}, "score": 3.6041673180926197}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7944062728066986, "2": 0.18930445253352987, "3": 0.010988010007315772, "4": 0.004854158590914389, "5": 0.00044668451300356187}, "score": 1.2276297823299207}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9572914867975097, "1": 0.02795792716763728, "4": 0.014685039860012955, "3": 4.842903632761249e-05, "2": 1.5909693188386296e-05}, "score": 4.873338511380395}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9213519746406035, "2": 0.07855824144904909, "3": 8.859696110341384e-05, "4": 1.0304365608854664e-06, "5": 7.191039549400723e-08}, "score": 1.078738820984005}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8914946792576547, "3": 0.10504249462327939, "4": 0.001886837748744014, "1": 0.0015685577694419866, "5": 7.31063807536745e-06}, "score": 2.107269557133908}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.4195622932745446, "4": 0.26382995320916786, "2": 0.19475393286625214, "3": 0.11322065105917352, "5": 0.008632906848090878}, "score": 2.24721704970173}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7898716461098134, "3": 0.15958059285707876, "2": 0.04074362065067281, "5": 0.009369417979273983, "1": 0.0004336562016009255}, "score": 3.767000366791474}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6526875814177905, "4": 0.2561285530990046, "2": 0.08962586757978748, "3": 0.0015398879884109306, "1": 1.5558522480324605e-05}, "score": 4.471850486578168}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5899456883285474, "3": 0.18317474336030165, "1": 0.14574299742751126, "4": 0.08007533499341545, "5": 0.0010598600583480427}, "score": 2.2007622723097993}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.974247643061514, "1": 0.02280798922029779, "3": 0.002906404874203371, "4": 3.549882360213527e-05, "5": 2.311992155753685e-06}, "score": 1.9801763462638222}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8174802545157357, "2": 0.17796649086133295, "3": 0.0038412467138872423, "4": 0.0006797839709823723, "5": 3.219398255665926e-05}, "score": 1.187817117758438}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9762264558949804, "4": 0.022449619807841794, "3": 0.0013208599199244508, "2": 7.55945918274266e-07, "1": 0}, "score": 4.97490633458755}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7826410165192909, "4": 0.20632186048022305, "3": 0.007419675172887356, "2": 0.003615695677417794, "1": 1.2091523270702897e-06}, "score": 4.767986739549739}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5540662026533815, "3": 0.4458369396402901, "4": 7.317271151593018e-05, "1": 1.8168540563471033e-05, "5": 4.558613671815199e-06}, "score": 2.4459792195407672}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"2": 0.938623264072946, "1": 0.058873676896124424, "3": 0.0024047171295322974, "4": 9.749192538052077e-05, "5": 7.809927266642207e-07}, "score": 1.943728363180546}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5908673363233893, "4": 0.345841085462999, "5": 0.025321863157346317, "3": 0.022859735296802252, "2": 0.015107146031321038}, "score": 2.1996407250989916}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7758541868490809, "3": 0.20094123034893155, "2": 0.017562567297664967, "5": 0.005444501928323327, "1": 0.0001971580237031237}, "score": 3.7687865807044902}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6021474681305544, "3": 0.3203340888980364, "2": 0.0743074695507413, "1": 0.0018968550520294563, "5": 0.0013135846562775761}, "score": 3.526673738880594}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9228766811132221, "5": 0.07487277044636632, "1": 0.0014394506949637917, "3": 0.0006758572992426902, "2": 0.00013455547371181407}, "score": 4.069609497795399}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6177044822205933, "4": 0.3734324565448503, "3": 0.008411617440543091, "2": 0.0004297846021560956, "1": 2.12980934211362e-05}, "score": 4.608369620976793}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9943686100574852, "4": 0.005555928628582675, "3": 7.211784794456403e-05, "2": 1.8429076298215995e-06, "1": 0}, "score": 4.994294298390901}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9773175530885111, "3": 0.021215246102382748, "4": 0.0014622197809290157, "2": 2.1657669712650174e-06, "1": 0}, "score": 4.956100667125303}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8460895786942075, "1": 0.07577180660859147, "4": 0.06839148160826375, "2": 0.00730943718982849, "3": 0.0024312574167765283}, "score": 4.60172790128646}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.998672905369939, "5": 0.0010063272117513589, "4": 0.0002937936229123673, "3": 2.6287737033759467e-05, "1": 4.0764546444508493e-07}, "score": 2.003632449983969}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.708446503079524, "2": 0.29149544482094003, "3": 5.766731554341279e-05, "4": 3.8670334045786073e-07, "5": 3.110065365924322e-08}, "score": 1.2916120543356324}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7502264910307435, "3": 0.22267697506123565, "4": 0.025988113982678557, "1": 0.0010312619835198648, "5": 7.71375011043845e-05}, "score": 2.2738533591441454}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9975561138640927, "4": 0.002438653344563665, "3": 2.8620597501111985e-06, "2": 1.0438727112784058e-06, "1": 4.7293588846427513e-07}, "score": 4.997550597082647}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9392669804109691, "4": 0.0598084992618628, "1": 0.0005541650452341048, "3": 0.00018808002891400338, "2": 0.00018096588954697484}, "score": 4.937055700413764}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9470208302479558, "3": 0.029863950347254607, "5": 0.022187586792045275, "2": 0.0009273819956375802, "1": 0}, "score": 3.990468870064851}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8677164918214455, "3": 0.1169373450518144, "5": 0.00887233030125142, "2": 0.0064684568979815685, "1": 3.6504869073236924e-06}, "score": 3.8789869111918556}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.876773102633427, "4": 0.08549069836587457, "5": 0.020060028012773408, "2": 0.014535544272847895, "3": 0.003135077450809592}, "score": 1.3575198902955368}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9990682513475985, "4": 0.0009265075160197892, "3": 3.713034838385969e-06, "1": 5.360266269306787e-07, "2": 0}, "score": 4.999063921379135}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6115588253715517, "4": 0.3879297548307487, "3": 0.0004719934262085341, "2": 2.437377009486397e-05, "1": 7.610824862851088e-06}, "score": 4.6110197990033654}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.998174998044982, "5": 0.0017463008993769933, "4": 6.125886403937617e-05, "2": 1.2488104584330203e-05, "3": 3.914758172130815e-06}, "score": 1.0071893052826069}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"1": 0.562925008239203, "2": 0.3910722865489412, "3": 0.039457031866812646, "4": 0.006255595098127609, "5": 0.0002897349553375384}, "score": 1.4899122435810468}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7646862729414761, "5": 0.20647269560430334, "3": 0.02502114529027519, "2": 0.003782386951470808, "1": 3.610901502922466e-05}, "score": 4.173778690952689}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9935005301220702, "4": 0.0064882592797332935, "3": 9.970159261957573e-06, "1": 0, "2": 0}, "score": 4.993491792328708}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9482979204680555, "4": 0.050294004691706966, "3": 0.0014066274769198627, "1": 0, "2": 0}, "score": 4.946892663488843}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9112440638263442, "5": 0.08759800984169296, "3": 0.001131121794727685, "2": 2.6386685820702693e-05, "1": 1.0194371394925138e-07}, "score": 4.086413836142978}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8363291778406956, "2": 0.10030224514175656, "3": 0.04611191050430449, "4": 0.016539149690311884, "5": 0.0007163526387695522}, "score": 1.2450092110122226}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9975321524549977, "3": 0.0018406178052397686, "1": 0.0004902799517031616, "4": 0.0001341946768514384, "5": 2.6797742555313476e-06}, "score": 2.0016267666525622}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9824843000099845, "5": 0.015846882273414468, "3": 0.0008828157877670889, "4": 0.0007858127700137662, "1": 0}, "score": 2.049995097605052}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9999865748701179, "2": 1.0926746140062836e-05, "4": 1.5255462733724644e-06, "5": 7.452053641320887e-07, "1": 0}, "score": 2.9999920892090604}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9984254348305248, "1": 0.001352692808888881, "3": 0.00021520898041378747, "4": 6.2446341435622115e-06, "5": 3.1198148308022503e-07}, "score": 1.9988759412642516}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6752968547309501, "1": 0.3087114367670814, "3": 0.015585664960099221, "4": 0.0003900709157945454, "5": 1.5930612266059953e-05}, "score": 1.7077021495808593}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9189062912476875, "2": 0.08038462117590611, "3": 0.0005910124942019487, "4": 9.738610661954501e-05, "5": 2.0609941530788815e-05}, "score": 1.0819412507264412}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.5500776824010343, "2": 0.3693673875632362, "3": 0.06543253939415179, "5": 0.010333538588077867, "4": 0.004786112900659271}, "score": 1.555926482173432}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8746917591020406, "4": 0.07811172541896085, "1": 0.045815931454302135, "3": 0.0008504138029004466, "2": 0.0005250922481741927}, "score": 4.7353471005130645}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7960076520944325, "4": 0.18776494330508792, "1": 0.0104727147423126, "3": 0.004549390550207738, "2": 0.0011998412771238082}, "score": 4.757644570010464}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5762516853442889, "3": 0.3963100379249155, "2": 0.019652388419246027, "5": 0.007757559435413473, "1": 2.8333066721946278e-05}, "score": 3.5720577472651693}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8074808656141065, "3": 0.14805170620236466, "4": 0.03132244956594704, "1": 0.013106748876804077, "5": 3.8248775931295294e-05}, "score": 2.197704599021912}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998976540877003, "4": 0.00010087554789135646, "3": 1.3481126240037137e-06, "1": 0, "2": 0}, "score": 4.999896428214199}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.835662746974635, "4": 0.15543028124887023, "1": 0.004721818396877671, "2": 0.003198357123234694, "3": 0.0009864921400941445}, "score": 4.814114332982867}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9996698336369138, "4": 0.00015876967354934616, "1": 8.114450341005878e-05, "5": 6.579280974473562e-05, "3": 2.4381058941750643e-05}, "score": 2.0004581543677467}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"2": 0.975479128346243, "3": 0.012565874654792522, "1": 0.011900534070473522, "4": 5.426837029034419e-05, "5": 1.125950593601118e-07}, "score": 2.000774215173535}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7315369625476359, "1": 0.18374488095969513, "3": 0.08076302738874981, "4": 0.003922821945954585, "5": 3.210056264821956e-05}, "score": 1.9049600723741043}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9537251259363516, "4": 0.03762194331540074, "3": 0.004218134543377737, "1": 0.0024846228539148066, "5": 0.0019496264282807556}, "score": 2.0828263229047006}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8470294374291161, "5": 0.13681540096183245, "4": 0.01514023362673125, "2": 0.0005115143081709987, "3": 0.0004914880165784098}, "score": 1.5941838811023517}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8732570954428559, "5": 0.06118330015407364, "4": 0.05015074044886194, "2": 0.013408693684074033, "3": 0.0019948195178017764}, "score": 1.4125859623278583}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7602901060886875, "3": 0.1324299304799977, "1": 0.08959324970080253, "4": 0.017516762488828386, "5": 0.00016964560047847628}, "score": 2.0783791665141904}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5548298105052625, "3": 0.29624238248327767, "2": 0.13620100587704229, "5": 0.010738949570913361, "1": 0.001986828361238131}, "score": 3.43613349330035}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9668003510961996, "4": 0.03232560947177585, "3": 0.0008721082516149333, "2": 5.985971515853252e-07, "1": 0}, "score": 4.965928332830207}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9999655955278475, "3": 3.300557735569069e-05, "1": 8.908809787929904e-07, "4": 3.8557350024600237e-07, "5": 0}, "score": 2.000032885847404}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8963888731054882, "1": 0.07793381017864241, "4": 0.025156657644317067, "2": 0.00026170385969211503, "3": 0.00025045983239933427}, "score": 4.661819197422994}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5333270183959858, "2": 0.30972517715665976, "4": 0.1534058124436299, "1": 0.0021680340279045113, "5": 0.0013732479205461497}, "score": 2.8420909509481005}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9984893760427471, "3": 0.0012436698671365466, "4": 0.0002141703139267172, "1": 5.2007844239503323e-05, "5": 6.486419288524632e-07}, "score": 2.001621948782995}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8864680931944775, "3": 0.09038792441379136, "5": 0.023074090830449978, "2": 6.898937849991713e-05, "1": 0}, "score": 3.9325481268057403}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7534568941879285, "1": 0.22625382284327153, "4": 0.019457915988882923, "3": 0.0006213808369441963, "2": 0.00020828775433992414}, "score": 4.073657594411711}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8466106425868659, "5": 0.14767495064537492, "3": 0.00567114637011674, "2": 4.1284022386692184e-05, "1": 8.750165819223149e-07}, "score": 4.141918767484205}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7905501527548155, "3": 0.14472426031488553, "5": 0.038396268445837003, "2": 0.026313651658586505, "1": 1.5089038574063215e-05}, "score": 3.8409993458294975}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8440487039071369, "5": 0.13203783086432036, "3": 0.023832597322513274, "2": 7.922132819547335e-05, "1": 7.389334309211266e-07}, "score": 4.108044672151265}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9883989778641454, "4": 0.01159293984748592, "3": 7.062912896354392e-06, "1": 0, "2": 0}, "score": 4.988392922494752}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8637951700373957, "4": 0.13607762282489136, "3": 0.00012223941722781993, "2": 1.2598637219913697e-06, "1": 0}, "score": 4.863673613270772}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8861086057819701, "5": 0.08092426999261107, "3": 0.032374538949691764, "2": 0.000586559761453683, "1": 5.872612285700829e-06}, "score": 4.047359000924439}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"2": 0.951903383748625, "1": 0.044365302068774745, "3": 0.003701271017787212, "4": 2.915911503145159e-05, "5": 7.71861273969317e-07}, "score": 1.9593965982076622}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8037310425181818, "3": 0.17649500558111553, "4": 0.01943174130899093, "1": 0.00029855272725813007, "5": 4.3593696227514627e-05}, "score": 2.2151907303689296}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5379803734833511, "5": 0.2773514789675191, "3": 0.13771778830504644, "2": 0.04694754332701859, "1": 9.107740450807418e-07}, "score": 4.045735958819843}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9925472921843257, "3": 0.005247788653337925, "4": 0.001962508062570443, "1": 0.0002355112205488839, "5": 6.818234435837123e-06}, "score": 2.0089577489925907}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9997445341369622, "4": 0.00015333921487568295, "3": 9.380663207755423e-05, "5": 6.396247932905732e-06, "1": 1.6863890023458346e-06}, "score": 2.000417987515847}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9209776961614808, "5": 0.04283856631495732, "3": 0.0348725776261976, "2": 0.0013079280959152936, "1": 2.8948854961538207e-06}, "score": 4.00534144964006}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9682947405617759, "4": 0.03161890113558407, "3": 7.981093761948159e-05, "1": 4.236267428074888e-06, "2": 2.0758102470360087e-06}, "score": 4.968198297006186}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9973457086770419, "5": 0.0022132749113160676, "4": 0.00040539486116043046, "3": 3.2981689965963684e-05, "1": 2.4616960361229207e-06}, "score": 2.0074811357830717}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7133412225827954, "1": 0.25195184525215797, "5": 0.016317355222887627, "4": 0.013308943847820004, "3": 0.005079835499013571}, "score": 1.8286978069813302}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9615463492181993, "5": 0.01730482352268989, "4": 0.012876864852608649, "2": 0.0073603263955735075, "3": 0.0009094750436679478}, "score": 1.1170294180282359}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5004440123102678, "1": 0.4899340444992623, "3": 0.009403954374764451, "4": 0.00021352342763588799, "5": 4.344686299052717e-06}, "score": 1.5199099328419499}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9953484983984001, "2": 0.004650972227753482, "3": 5.017383842556615e-07, "4": 3.037594249861917e-09, "5": 0}, "score": 1.0046519849317337}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7470865478387952, "3": 0.2030500253507596, "5": 0.049478749728330745, "2": 0.0003833032908660841, "1": 4.866683266467383e-07}, "score": 3.8456605208727694}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6057436695127719, "4": 0.32864685295224183, "1": 0.03034989564099514, "3": 0.02695053851023132, "5": 0.008307969866675044}, "score": 2.678818987097525}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5570088224234224, "4": 0.315150587132251, "3": 0.1277856280417178, "2": 5.3584377335163956e-05, "1": 0}, "score": 4.429116616960577}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"2": 0.933961754186651, "1": 0.0585343802961915, "3": 0.0074257766532443426, "4": 7.65923772405882e-05, "5": 1.3935640885727188e-06}, "score": 1.949048756559766}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7847732864363337, "1": 0.14545449360766524, "3": 0.06573101466255975, "4": 0.004009761964096527, "5": 3.128616721863233e-05}, "score": 1.9283898922303464}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8083207996390916, "3": 0.09224990738671991, "5": 0.058805493592373186, "2": 0.04045055155883076, "1": 0.00017270717977381093}, "score": 3.8851362994483902}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8802804227992922, "4": 0.11908913888740713, "3": 0.00033026522968519995, "2": 0.0002790596499195093, "1": 2.073324722564111e-05}, "score": 4.879330172837527}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.926482862925844, "5": 0.030666752245223076, "2": 0.021201676929167825, "3": 0.016998961925436033, "1": 0.004648746805031414}, "score": 3.9573181533999655}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8965781889109289, "5": 0.0826122173158387, "3": 0.02000814176532187, "2": 0.0007973953137075423, "1": 3.901119479472147e-06}, "score": 4.060997591054347}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9143584711824793, "3": 0.04875106186155563, "1": 0.032823688956071836, "4": 0.004041025833734097, "5": 2.5634101578941638e-05}, "score": 2.0240863297214307}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9597436964798559, "5": 0.034121953642886144, "3": 0.006133210073188462, "2": 6.23418995046237e-07, "1": 0}, "score": 4.02798751118404}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9420769837677686, "3": 0.05186530030432009, "5": 0.0044127111728419904, "2": 0.0016447695430325904, "1": 0}, "score": 3.949257859847294}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9191702978625191, "4": 0.07945805552600518, "3": 0.0010300293314604411, "5": 0.0003411362160113494, "1": 2.94527046312094e-07}, "score": 2.160969284531179}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9319655802879739, "4": 0.06746669569332489, "3": 0.0005568292043379166, "2": 9.410391505237444e-06, "1": 0}, "score": 4.93139131287918}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7136486675498674, "4": 0.28515434040942333, "3": 0.0011057995842861147, "2": 9.034589286602144e-05, "1": 0}, "score": 4.712362779240218}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9794522599392363, "4": 0.020519894500375942, "3": 2.6387873248281547e-05, "1": 0, "2": 0}, "score": 4.979427299764566}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8630432528304474, "5": 0.07553409766325608, "3": 0.05947745177615474, "2": 0.0019415823384166633, "1": 1.885089986514034e-06}, "score": 4.012167846994355}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.959573753395677, "4": 0.0403560805682518, "3": 6.865771846162643e-05, "2": 4.189911663262909e-07, "1": 0}, "score": 4.959505302909382}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8154550075953275, "3": 0.10866543724976589, "2": 0.04176293730992502, "5": 0.03410829053667182, "1": 7.950195805330629e-06}, "score": 3.8418930684555392}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8534068086471382, "5": 0.14578697472347668, "3": 0.000801275279619458, "2": 1.7582615372493552e-06, "1": 0}, "score": 4.144982644413331}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9974086824747233, "4": 0.0025885388837614187, "3": 3.750100542507818e-07, "1": 0, "2": 0}, "score": 4.9974107048724195}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8934023371947408, "5": 0.10207991419012398, "3": 0.004409072187412285, "2": 0.00010505663208656827, "1": 1.4846685637708012e-06}, "score": 4.097456482814823}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9215976398227564, "4": 0.07834602855326822, "3": 5.491785690219776e-05, "2": 1.3095016578184768e-07, "1": 0}, "score": 4.921543642237287}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8092036929451987, "1": 0.12043255407156792, "3": 0.0668969569118409, "4": 0.0034269161632047764, "5": 3.979895111164195e-05}, "score": 1.953437628250464}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7740423663531842, "5": 0.2189776082120833, "3": 0.0069149053610269694, "2": 6.018027001396546e-05, "1": 4.429175981055918e-06}, "score": 4.211929162999987}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5844157609578369, "5": 0.2193470281281231, "4": 0.18681615015351144, "3": 0.009158993374027225, "1": 0.0002615055633302842}, "score": 3.0405714571192446}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8766926623915129, "4": 0.12317021727561206, "3": 0.00013494989453665128, "2": 1.0961626249685317e-06, "1": 0}, "score": 4.876556461835045}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.45235271524372245, "4": 0.4396059154963948, "1": 0.09970436715647457, "3": 0.006272723805059515, "2": 0.002058170083379516}, "score": 4.142851422369677}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9537413880421162, "3": 0.028661354405645344, "1": 0.01748131295033941, "4": 0.00011453478293619238, "5": 1.1943254606836735e-06}, "score": 2.0114126964569223}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5881339799389217, "2": 0.392496719404382, "4": 0.01894278421840926, "1": 0.00039399789158017936, "5": 3.228854611716929e-05}, "score": 2.6257225600390695}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.49440468339361404, "3": 0.4872579620197059, "2": 0.014671541704760722, "5": 0.0036466403037556747, "1": 1.871944003542074e-05}, "score": 3.4869892040896704}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8966653979329755, "5": 0.07812651336821791, "3": 0.024842514479672857, "2": 0.0003608980678604472, "1": 2.806178400723884e-06}, "score": 4.052553882491957}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9520204941062042, "4": 0.047862804510747856, "3": 0.00010895354055922633, "2": 3.20048243046934e-06, "1": 2.971614946201275e-06}, "score": 4.951897724704132}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5235738127728142, "5": 0.46373328909789324, "3": 0.012194734728882512, "2": 0.0004205952870754056, "1": 7.329479215196675e-05}, "score": 4.4504794044615865}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7090203857801259, "5": 0.2801897574984084, "3": 0.010630943843758352, "2": 0.00015009982278076586, "1": 0}, "score": 4.269260987020956}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6520968729160594, "4": 0.34666045290083, "3": 0.0012353049701425852, "2": 6.1224451923605595e-06, "1": 0}, "score": 4.650850134514506}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6629914266673619, "4": 0.3365213111852703, "5": 0.0004728835000097584, "2": 1.1469468111992521e-05, "1": 0}, "score": 3.337456590438887}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9698567876332606, "4": 0.028937489788990668, "2": 0.001125090614890636, "5": 7.993082378891004e-05, "1": 0}, "score": 3.0279722804341365}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9980758360815041, "1": 0.0014919022431859321, "3": 0.0003540740804201992, "4": 7.18382136466384e-05, "5": 6.127093892219991e-06}, "score": 1.9990242293293026}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9912402560931811, "3": 0.005924959070009955, "4": 0.0026645635656762216, "5": 0.0001576430906629881, "1": 1.2553425266793692e-05}, "score": 2.0117144623380785}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9871009985096978, "4": 0.009200697339756788, "1": 0.0029943302354071815, "3": 0.00042829403525431955, "2": 0.00027488767452813823}, "score": 4.977140712515272}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5787557143636155, "3": 0.29385348094523134, "4": 0.11384513716873651, "5": 0.00809372992819121, "1": 0.005451677061150794}, "score": 2.540373408791273}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9948720580158359, "4": 0.004741645744762305, "1": 0.00020527377130336033, "3": 0.00011653743571111093, "2": 6.22463287663221e-05}, "score": 4.994017431919107}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5884871192188086, "3": 0.2214361484285553, "4": 0.18045740724437798, "5": 0.005612359834691261, "1": 0.0040067974405638175}, "score": 2.595181344871894}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9437183145210056, "5": 0.03442118710427119, "4": 0.016698230888354326, "2": 0.0035784161237543484, "3": 0.0015822922376339422}, "score": 1.1945227449664408}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987102386580181, "4": 0.0012231648987606593, "3": 3.8118607851697094e-05, "2": 2.8208731508050275e-05, "1": 0}, "score": 4.998615971318565}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986222629523095, "1": 0.001256223852881703, "4": 0.00012044184929220048, "3": 3.5494499611380914e-07, "2": 0}, "score": 4.994853949162556}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9519242316129262, "5": 0.03294042342114462, "4": 0.015103220194252115, "3": 3.162422870464278e-05, "1": 0}, "score": 2.1290593994804174}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8133633616362155, "5": 0.18028733414864864, "3": 0.005546301332285189, "2": 0.00080255489525296, "1": 0}, "score": 4.173136000588639}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7343859287927538, "5": 0.2495298079961983, "3": 0.01598791107711865, "2": 9.57038529122212e-05, "1": 2.7595031653163717e-07}, "score": 4.233349748245581}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9985754209774189, "4": 0.0013514902587579696, "3": 6.514148248055756e-05, "2": 7.712015429074732e-06, "1": 0}, "score": 4.998495090375941}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5464219825106273, "4": 0.44640214179441007, "3": 0.007165988248481757, "2": 9.178378526804742e-06, "1": 0}, "score": 4.539238019861491}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.970953081142378, "5": 0.0264300911933291, "2": 0.0025071603523615918, "3": 0.00010857601838869946, "1": 7.353509269828591e-07}, "score": 4.021304996000793}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7132837295972536, "2": 0.2841259651201184, "4": 0.0023852698890900843, "1": 0.00014968013111950392, "5": 5.515633225990525e-05}, "score": 2.7180702010869133}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9630129497252715, "2": 0.036967874509164105, "3": 1.8684317917026037e-05, "4": 1.637509763509951e-07, "5": 1.6200259229841294e-07}, "score": 1.0370063885400358}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9251121181537887, "2": 0.07447133445921736, "3": 0.000393606845860173, "4": 2.0887785409643106e-05, "5": 2.1339155061235526e-06}, "score": 1.0753297410554457}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9928211211429449, "4": 0.006429584254351728, "3": 0.0003421381346373205, "2": 0.00024029721619393569, "1": 0.00016576871902183296}, "score": 4.991502163684534}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9946445050704087, "1": 0.005339779067464041, "3": 1.0288667614805873e-05, "4": 3.1673065500567224e-06, "5": 2.3393393441910565e-06}, "score": 1.994683862653658}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5821916092022973, "1": 0.381547052631684, "3": 0.03532044868151191, "4": 0.00091950470226137, "5": 2.1389551560569246e-05}, "score": 1.6556765757512193}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.879940040171508, "2": 0.09406959484122042, "4": 0.023435788544947257, "5": 0.002554017932646506, "1": 4.1681639994686204e-07}, "score": 2.934473386651539}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9634177506023734, "4": 0.03625509339874966, "3": 0.00032564230594918126, "2": 7.561009030729108e-07, "1": 0}, "score": 4.963091325724926}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7667881666885118, "4": 0.23232426249445698, "3": 0.000740070578472427, "2": 0.0001467538301158095, "1": 4.209305421044774e-07}, "score": 4.765753574894046}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8324905571122303, "4": 0.13855774622464956, "5": 0.027382430332611323, "2": 0.0015687345558643303, "1": 1.962228173884213e-07}, "score": 3.1917535442316245}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"1": 0.901310305000152, "2": 0.09853854377346735, "3": 0.00014757810454395185, "4": 2.0902497531754433e-06, "5": 1.3316523745165333e-06}, "score": 1.0988453122886723}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.965344772740738, "1": 0.02688667683534102, "4": 0.007632727706480488, "3": 8.028939604223865e-05, "2": 5.122468567613306e-05}, "score": 4.884505814480669}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9467850419490562, "4": 0.05311466031739094, "3": 9.853260986073751e-05, "2": 1.0658254378414009e-06, "1": 0}, "score": 4.9466850397035165}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7603474341239264, "2": 0.19765849700581442, "4": 0.019318057475482684, "3": 0.01763145070143357, "5": 0.00504418592970276}, "score": 1.3110524311250822}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7200559727954156, "5": 0.2451306610962565, "3": 0.019470437293284314, "2": 0.013373528646361977, "1": 0.0019675345843750244}, "score": 4.193010922835271}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6036127071743401, "1": 0.38955370160164954, "3": 0.006169194503953567, "4": 0.0005728838883019064, "5": 9.114125520043824e-05}, "score": 1.6180345425151006}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.567662782129895, "4": 0.24540509129430063, "5": 0.07950574466463169, "2": 0.06578485067903027, "3": 0.04163370597493016}, "score": 2.203299931301785}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.999415206418459, "4": 0.0005621577800797024, "3": 2.1741645264389075e-05, "1": 0, "2": 0}, "score": 4.999394358387853}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7615157225839387, "4": 0.2381975279877425, "3": 0.00027750239338615644, "2": 5.414792487700016e-06, "1": 0}, "score": 4.761230307824674}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9179755341220209, "1": 0.0775441598797505, "4": 0.00437561017642631, "2": 5.950388222870249e-05, "3": 4.3096490115755e-05}, "score": 4.685182385993256}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"2": 0.558732786884266, "1": 0.435031994510202, "3": 0.006103393811342197, "4": 0.00012563357786117722, "5": 6.079239208479049e-06}, "score": 1.5713408561744715}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9715974513548054, "1": 0.02458485195248256, "3": 0.003620149339463275, "4": 0.00019541305674289277, "5": 2.051088356673777e-06}, "score": 1.979432275054134}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5108516214122254, "5": 0.4864178260744454, "3": 0.0026395601118672247, "2": 8.96906527513393e-05, "1": 6.69779689685449e-07}, "score": 4.483597180936443}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5673116948112688, "4": 0.26303409931993615, "1": 0.11986914374325444, "2": 0.034332934362425786, "3": 0.015414117017772507}, "score": 4.123628977068445}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9560557134131431, "4": 0.04391892317301645, "3": 2.340221223762043e-05, "1": 0, "2": 0}, "score": 4.956034186176683}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9633116388714495, "3": 0.030576134274316342, "4": 0.006092977502953778, "1": 1.3722263103973011e-05, "5": 5.461066268513517e-06}, "score": 2.042764753039336}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9149545345111595, "5": 0.08482673624232102, "3": 0.0002147656766993752, "2": 3.0637313176283654e-06, "1": 0}, "score": 4.084605919234649}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9681461129172406, "4": 0.031671381425856, "3": 0.00014936762632672683, "2": 3.04340351046152e-05, "1": 1.989743145841292e-06}, "score": 4.96793059933795}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7767511889791104, "5": 0.22321672912651921, "3": 2.3606085948596758e-05, "1": 0, "2": 0}, "score": 4.2231950147987565}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7051366254367066, "3": 0.2816639458623566, "4": 0.013141370125690806, "2": 5.48474424723081e-05, "1": 0}, "score": 4.423364344168526}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7930284750376287, "1": 0.20561933664371868, "3": 0.0008089724466620014, "4": 0.0005074542494393335, "5": 3.572263630314845e-05}, "score": 1.7963117042696888}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9781574491050555, "4": 0.021421658271263334, "3": 0.0002456003344316078, "2": 0.00017311282645507062, "1": 0}, "score": 4.977567753690262}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.995402470643284, "4": 0.004591875650162399, "3": 4.809372210174552e-06, "2": 1.66777207840574e-07, "1": 0}, "score": 4.995398002155677}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9830176949800378, "4": 0.015921646190274523, "1": 0.0007655913624159509, "2": 0.00017050106754488184, "3": 0.0001224943073097643}, "score": 4.980259455638575}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993631792064882, "4": 0.0004277926253545361, "1": 0.0002041092843422659, "3": 2.23455378187338e-06, "2": 1.6226044734907512e-06}, "score": 4.998746431985346}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9185191181582748, "3": 0.044016060513234805, "1": 0.03644607893914288, "4": 0.001014548594393326, "5": 4.144932724613689e-06}, "score": 2.0096115140306923}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6118451080037558, "3": 0.37501346012095804, "4": 0.012897155445896868, "1": 0.00021691087566716197, "5": 2.72460227945691e-05}, "score": 2.4006726460982413}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7793624229747006, "2": 0.2201808995119722, "3": 0.000441218959029407, "4": 1.4421491481597466e-05, "5": 1.0082630097282085e-06}, "score": 1.2211106413244586}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6081398542681254, "5": 0.3011440672505777, "3": 0.08571726629364734, "2": 0.0049864901173768995, "1": 1.1308029605885933e-05}, "score": 4.205420104937698}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.961392727538623, "3": 0.02317750923584474, "4": 0.009518217358225488, "1": 0.005736385332670463, "5": 0.0001748853397863046}, "score": 2.0370022248218063}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8905394644972335, "3": 0.06756062067944496, "5": 0.039920683737207203, "2": 0.0019469629150499566, "1": 3.172254281510492e-05}, "score": 3.9683709523415143}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8468032768864446, "5": 0.06896707239177717, "3": 0.0588176381806856, "2": 0.02470822240137768, "1": 0.0007031075434310301}, "score": 3.9586236385346925}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7928458061093626, "4": 0.11334350546100544, "2": 0.09352841360769573, "5": 0.00026958360313712515, "1": 1.2533644116684354e-05}, "score": 3.020329194974717}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9780301805161458, "4": 0.0139666630454199, "5": 0.0071910549025006485, "2": 0.0005690651108888374, "3": 0.00023789265867518554}, "score": 1.071709428031046}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.35720940519260075, "3": 0.3233772437374424, "2": 0.317075393182326, "5": 0.0022869704154255487, "1": 5.0695926285182835e-05}, "score": 3.0446065739934203}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9626067152299201, "3": 0.030744806294095976, "1": 0.006269018974350243, "4": 0.0003763703221253097, "5": 2.931747196090994e-06}, "score": 2.0252373271787554}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8703240460133425, "2": 0.1296268941503948, "3": 4.8519731873807185e-05, "4": 4.053917311115491e-07, "5": 4.646362911394127e-08}, "score": 1.1297253470919881}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9814481538925978, "3": 0.01777198389694871, "1": 0.0005563444172563605, "4": 0.00022254193549103136, "5": 1.012890938894061e-06}, "score": 2.0176637613693447}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.894373916618659, "4": 0.054768076521591304, "2": 0.05061925709950583, "5": 0.00023711815423108952, "1": 7.479595036072748e-07}, "score": 3.0046215638953693}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5151099221632609, "3": 0.21526122249643606, "4": 0.16695476024517658, "1": 0.09427053484934561, "5": 0.008401303555451876}, "score": 2.480105202252566}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6515894977615038, "4": 0.2928229262283648, "2": 0.049714213542268904, "5": 0.0057446057208600495, "1": 0.00012869310744528684}, "score": 3.2543405540990458}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9409489835593303, "3": 0.0354421248067058, "5": 0.02247786571426802, "2": 0.0010720716295025245, "1": 5.785220437717533e-05}, "score": 3.9847180241933766}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9056507435780897, "3": 0.08494889827905765, "5": 0.0083690240687045, "2": 0.0010294286905453524, "1": 1.7584567151121615e-06}, "score": 3.9213559814834893}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8384811823584316, "3": 0.12062383227398754, "5": 0.030541731031569284, "2": 0.010268708680468112, "1": 8.415224156096018e-05}, "score": 3.88912798105336}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6413168746381689, "4": 0.35606125440351966, "3": 0.002588578488709316, "2": 3.226243524663171e-05, "1": 0}, "score": 4.638664429125271}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9979499839590824, "2": 0.0020492782930243134, "3": 7.450921015249169e-07, "5": 1.0477968733279544e-08, "4": 0}, "score": 1.0020508103525525}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9749138683893448, "2": 0.025074838144760886, "3": 1.0939341004865416e-05, "4": 1.6967584741957046e-07, "5": 6.927075677278093e-08}, "score": 1.025097505828028}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7395429120867476, "1": 0.13965798633577983, "4": 0.07554963662527286, "3": 0.02861929323364356, "5": 0.016627704981852728}, "score": 2.089943916961929}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9961485728441168, "1": 0.0036961335211609008, "4": 8.197797043708816e-05, "5": 6.188733521093323e-05, "3": 1.1191320896771432e-05}, "score": 1.9966646749557435}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8789718560105974, "2": 0.0764301902900978, "4": 0.023241077129204094, "5": 0.010783764100554793, "3": 0.010568430250660085}, "score": 1.2104263238433572}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7626992981728927, "1": 0.22758520118487804, "3": 0.009230962097352942, "4": 0.0004393253074763665, "5": 4.5115937161874556e-05}, "score": 1.782659738191654}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9940790811392308, "3": 0.003095498560608273, "1": 0.0028149108148670275, "4": 1.0369445590266523e-05, "5": 1.592365507101463e-07}, "score": 2.00030180434078}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6980208888139557, "5": 0.27657896806690596, "3": 0.019534874008937428, "2": 0.005860097718618991, "1": 4.195315551566653e-06}, "score": 4.245311552116803}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7317125012687206, "1": 0.26777020776246, "3": 0.0003275181777005894, "4": 0.0001605153470044629, "5": 2.88142644510629e-05}, "score": 1.7329646655579725}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9535683597632346, "1": 0.03694093474938243, "3": 0.00943076558051114, "4": 5.9004077870372164e-05, "5": 7.298797809470437e-07}, "score": 1.9726100229852679}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7143891050686164, "3": 0.14939831272827075, "5": 0.11987560486422787, "2": 0.016150628720650314, "1": 0.00018601095279316982}, "score": 3.9376179807720244}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8183750754712674, "5": 0.16991774703351759, "3": 0.011632861476776713, "2": 7.265153786769764e-05, "1": 9.785352756687516e-07}, "score": 4.158136755348341}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9907534625897112, "4": 0.009136678154529721, "3": 0.00010299099507632497, "2": 6.1633012916848385e-06, "1": 0}, "score": 4.990638843352207}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5774316203021405, "5": 0.4021032027709843, "2": 0.019315866931971137, "3": 0.0011474800520673237, "1": 1.0822655310746115e-06}, "score": 4.36232101295758}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6607967335252372, "3": 0.18656659982971746, "5": 0.13444322338891823, "2": 0.018176422350502115, "1": 1.6569133851171063e-05}, "score": 3.9114740314631096}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6622544045267865, "5": 0.3218398234195085, "3": 0.015589739585450128, "2": 0.00031138109814663725, "1": 3.831684631160834e-06}, "score": 4.305616077092931}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6826293131863919, "4": 0.3142915565000558, "3": 0.0022725709756298224, "2": 0.0007995144116692568, "1": 5.86674260874275e-06}, "score": 4.6787409128410395}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7419140708505527, "4": 0.2540328727657732, "3": 0.004043371521560908, "2": 7.605643655520831e-06, "1": 0}, "score": 4.73785702220762}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9717436566794514, "4": 0.028075274528732687, "1": 0.00010870432241503116, "3": 6.294627331129897e-05, "2": 8.45587577716788e-06}, "score": 4.971338620426225}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9338251442531427, "4": 0.04219236493584815, "5": 0.023942743174876217, "2": 3.3576907636449416e-05, "1": 0}, "score": 3.090044830020162}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9690545727982145, "5": 0.018068629882956107, "3": 0.012013551196028907, "2": 0.0008553900450593992, "1": 7.3749015867272616e-06}, "score": 4.004322175971777}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.9940483429993477, "4": 0.0031301166711405477, "2": 0.0028048607071796436, "5": 9.100347121037698e-06, "1": 7.5170634119426045e-06}, "score": 3.000328422551811}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6246157739307486, "5": 0.27429845872321257, "3": 0.05968620842071412, "1": 0.021671074066228938, "2": 0.019725378965275552}, "score": 4.1101486122831545}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.603444642545338, "4": 0.3865568239107426, "5": 0.00996838793157692, "2": 2.853334941143427e-05, "1": 0}, "score": 3.4064657217541012}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7632345423345068, "5": 0.11517624022952351, "3": 0.06496166190129953, "2": 0.030223521504159172, "1": 0.026402232711516052}, "score": 3.910560676076604}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6215892215051297, "3": 0.24627543867536877, "4": 0.1320582983142907, "2": 7.631683513812874e-05, "1": 0}, "score": 4.375161421027739}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.683073767581306, "1": 0.15797973716034022, "3": 0.11870880517997379, "4": 0.037804580743812606, "5": 0.0024329615958378695}, "score": 2.0436371207416655}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8879668213789377, "1": 0.11043060106363342, "4": 0.0013770116484167164, "3": 0.00013271175994734074, "2": 8.897785850730612e-05}, "score": 4.556366507349314}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6385462313144777, "5": 0.2336942597996001, "2": 0.10710533387651178, "3": 0.02065335299741397, "1": 3.613441531215189e-07}, "score": 3.998829154477332}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5456968921327261, "3": 0.3626233089169669, "4": 0.0903422719671565, "1": 0.0008936107323874642, "5": 0.00044380272825369913}, "score": 2.5437457120310314}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"2": 0.63378100639211, "1": 0.36041014657339154, "3": 0.005781983436837038, "4": 2.253157272819868e-05, "5": 4.189714352423916e-06}, "score": 1.6454294186928136}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7488596246892248, "3": 0.19156923408649634, "5": 0.05267245687509243, "2": 0.006862026998906934, "1": 3.651355487050594e-05}, "score": 3.8472696061642404}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7152984291083615, "4": 0.2178817270254012, "2": 0.05891069063240185, "5": 0.007089290599018615, "1": 0.0008193529619326953}, "score": 3.1715109990816766}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7434371643267891, "4": 0.12976071220464136, "3": 0.053586462934257985, "5": 0.03909111795782589, "2": 0.034120407953396256}, "score": 1.6869427825166294}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7801540724677013, "4": 0.21920134236480449, "3": 0.0006139242553801287, "2": 2.7975568003628136e-05, "1": 1.2464139121824635e-06}, "score": 4.779481579454161}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4804966127616841, "4": 0.375740264574778, "2": 0.13622485676125534, "1": 0.006371747590544972, "5": 0.001166018878921608}, "score": 3.229104064812364}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9212742618791244, "5": 0.06248625915069528, "3": 0.015798578679330325, "2": 0.0004346675812696635, "1": 5.486055767935914e-06}, "score": 4.045801921339701}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9875322238425229, "4": 0.01241046761470111, "3": 5.574069875602945e-05, "1": 0, "2": 0}, "score": 4.987478031355294}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7873448291869654, "4": 0.1974172835179881, "5": 0.008200210125330011, "3": 0.006825418644082597, "1": 0.00021158600481143553}, "score": 2.426049316578274}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5339678221412454, "4": 0.46301230434029567, "3": 0.0029913634265865655, "2": 2.6968716819843364e-05, "1": 6.194530039586139e-07}, "score": 4.530921152389923}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7093018801965583, "1": 0.2794404969798881, "3": 0.010724284818298912, "4": 0.0005127333671785698, "5": 2.048636530858338e-05}, "score": 1.7323706820154339}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.887423587438601, "1": 0.08045845618538246, "3": 0.03136426159609155, "4": 0.0007326698989564832, "5": 2.0834693583780406e-05}, "score": 1.9524336402428517}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7460649113725573, "4": 0.16352776280026698, "2": 0.0890829785814983, "5": 0.0011862727857564466, "1": 0.0001377990628784004}, "score": 3.076541752743897}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9587553884784108, "4": 0.041197014040426805, "3": 4.5883361553600245e-05, "2": 7.855874932738295e-07, "1": 0}, "score": 4.958708824133804}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5769568203632685, "3": 0.26354066408606697, "2": 0.12510691340583074, "1": 0.021253727228586712, "5": 0.013134262567220726}, "score": 3.4356142936827503}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6701019258721859, "2": 0.14142554275524785, "4": 0.12968903921263558, "5": 0.03297164926324276, "3": 0.025808561526231025}, "score": 1.7139987233929046}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.44835587413370265, "4": 0.3479566068299042, "5": 0.09402354023801661, "2": 0.06839921028234736, "3": 0.0412627303197819}, "score": 2.5708918541495724}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997297604212948, "4": 0.00026863284477084945, "3": 5.913616959833776e-07, "1": 1.2623974497637606e-07, "2": 0}, "score": 4.999729679232506}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7496351631049304, "4": 0.2226381435829883, "1": 0.014250033804851655, "2": 0.009854888031845878, "3": 0.0036181370958860873}, "score": 4.683559632845912}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998175716220805, "4": 0.000177974905134783, "1": 1.6213215008348004e-06, "3": 6.292406890132103e-07, "2": 0}, "score": 4.999814280918361}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9810911689749751, "4": 0.01875879443491813, "3": 0.00011810694858967638, "1": 2.2739501309124702e-05, "2": 6.978531849930718e-06}, "score": 4.9808930558100375}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997800373753263, "4": 0.00017091007790145563, "3": 4.8607850849055515e-05, "1": 0, "2": 0}, "score": 4.999731874101165}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8358263606854158, "4": 0.16368235320807312, "3": 0.00048217906922141805, "2": 8.393562625681056e-06, "1": 0}, "score": 4.8353279904763005}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4850864628577782, "5": 0.442092607331898, "2": 0.06058010743164017, "3": 0.00986365982728239, "1": 0.002375355900215533}, "score": 4.303943214060056}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.897727292487314, "5": 0.1021773040243885, "3": 7.182277009094605e-05, "2": 1.0336616156875414e-05, "1": 0}, "score": 4.102086160061505}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9143758112409447, "4": 0.08534449764082418, "3": 0.00021811066202603746, "2": 5.964978582230835e-05, "1": 7.034247016657726e-07}, "score": 4.914037412481636}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8402766299416896, "3": 0.09522194014781049, "5": 0.048071576581309686, "2": 0.016427722088031924, "1": 0}, "score": 3.919994021745402}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9375403425594598, "4": 0.062322123740977835, "3": 0.0001337979141104047, "2": 3.0466513150587486e-06, "1": 0}, "score": 4.9374010973378155}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5291567908596227, "5": 0.4665625705669431, "2": 0.0024694520377962505, "3": 0.0018079307856828446, "1": 1.4917628746698977e-06}, "score": 4.459812071519598}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9948659239520983, "5": 0.005126558513457119, "3": 5.99910659893771e-06, "1": 0, "2": 0}, "score": 4.00512056718207}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.44543528783816677, "3": 0.39262544018129275, "5": 0.10097812194612159, "2": 0.059113402714597967, "1": 0.0018468274571918116}, "score": 3.5845850118393345}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7122056464425939, "1": 0.2839774912851673, "3": 0.003748042407383053, "4": 6.726631275835036e-05, "5": 1.5472119324351607e-06}, "score": 1.7199097236077112}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.675298002736579, "4": 0.31642732013268055, "3": 0.008157985626324535, "2": 0.00011389449734044329, "1": 2.575597530728088e-06}, "score": 4.666904648982037}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9839796844767241, "4": 0.01599697719345614, "3": 2.264997069171695e-05, "1": 0, "2": 0}, "score": 4.983957711822304}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6151263716047904, "4": 0.3832600264226305, "3": 0.001582994931373918, "2": 3.0276976069084816e-05, "1": 0}, "score": 4.613483025210636}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.501784251279135, "3": 0.30502516426233267, "2": 0.16203163257539083, "5": 0.02978187773960518, "1": 0.0013767227816760587}, "score": 3.39656306795674}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4308699950475917, "1": 0.19163916961939623, "4": 0.1830682215969475, "3": 0.179113176856565, "5": 0.015309105452309828}, "score": 2.3995378992057166}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9830546728691278, "3": 0.01665260530536319, "4": 0.00029125977249976894, "2": 4.7167058884467836e-07, "1": 0}, "score": 4.966402081330219}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5807904607122161, "4": 0.4192038759307661, "3": 3.42447631044723e-06, "1": 0, "2": 0}, "score": 4.5807883365517075}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.723105924961944, "4": 0.25343735672482814, "3": 0.019270816998950304, "2": 0.0036826801141078497, "1": 0.000500970670755105}, "score": 4.694968399769339}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.997042251781505, "1": 0.0020461853994317575, "4": 0.0008976469665292966, "3": 8.293039578397199e-06, "2": 5.302999256568671e-06}, "score": 4.990885113443751}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9875959365391344, "4": 0.012384215014543488, "3": 1.91236647056801e-05, "2": 3.983869770092636e-07, "1": 1.4115207241436567e-07}, "score": 4.98757577558533}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9992065329615893, "1": 0.0006826890997848042, "4": 0.0001086979090492048, "3": 1.3326275009073963e-06, "2": 4.069827645270042e-07}, "score": 4.997156658520589}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99497802698455, "4": 0.005003087785789937, "2": 1.4240764024697064e-05, "3": 3.1582862608225914e-06, "1": 1.1318353944723835e-06}, "score": 4.9949433442162405}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9932521966616427, "1": 0.005138854933072895, "4": 0.0015870800462325387, "3": 1.0818012381370775e-05, "2": 9.80055540415779e-06}, "score": 4.977806434793178}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8735172512782612, "2": 0.12627631460889627, "3": 0.00020287662952482024, "4": 2.3996467954577496e-06, "5": 1.0429691088267719e-06}, "score": 1.1266934532377169}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.46204707460810973, "5": 0.2958562158322102, "3": 0.1864468998017945, "2": 0.05411289860572525, "1": 0.0015360370860259304}, "score": 3.996575404567564}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9563220827775185, "5": 0.04266847166401899, "4": 0.0009873193644472649, "3": 2.2069974347957427e-05, "1": 0}, "score": 2.130002131003976}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5743355911123553, "5": 0.35693699406181756, "3": 0.06677354565541055, "2": 0.001951401786098551, "1": 1.794390765575557e-06}, "score": 4.286255454309988}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5792331936929587, "4": 0.3376356916960521, "5": 0.056496629357426276, "3": 0.026181579185966617, "1": 0.00045228004563380115}, "score": 2.8704911155512725}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9937991418679011, "4": 0.005781104064034296, "2": 0.0002507314780630046, "1": 9.872207292528974e-05, "3": 6.998763320658399e-05}, "score": 4.992931835732147}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7891598740148525, "3": 0.07476657889992888, "5": 0.07330928550564812, "2": 0.062496982712820844, "1": 0.00026675151188524266}, "score": 3.872748419537682}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9511170205564458, "4": 0.0436995445120557, "3": 0.003412546814603602, "2": 0.0017706219675939112, "1": 0}, "score": 4.944163481095105}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6925524802760223, "5": 0.30610438737216084, "3": 0.0008083338533026477, "2": 0.0005332447745023866, "1": 0}, "score": 4.304230036659367}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9769466083496909, "4": 0.023018171724952685, "3": 2.7616338106504645e-05, "1": 4.125381737645107e-06, "2": 2.911746456296566e-06}, "score": 4.976901345748073}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9939587014755651, "2": 0.006037344596770851, "3": 3.858527206567532e-06, "4": 2.2894846394236462e-08, "5": 2.193044462465659e-08}, "score": 1.0060452183632398}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4895208125196044, "2": 0.46999956961087247, "4": 0.04015013805960043, "1": 0.00023513235255437457, "5": 9.400543107215194e-05}, "score": 2.5698681674893655}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9813317276784992, "4": 0.01860463566526733, "3": 6.213817646627789e-05, "2": 7.377933980356518e-07, "1": 1.8247311314685583e-07}, "score": 4.98126813387814}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7359759554591666, "5": 0.2040362101814253, "3": 0.05909050661764665, "2": 0.0008823853434797662, "1": 1.2453635122000747e-05}, "score": 4.143143928222788}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.6015494715401233, "2": 0.30628887083561523, "4": 0.09062002172552638, "5": 0.0009207384931268534, "1": 0.0006208000553103431}, "score": 2.7849310068285136}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.39872433124835255, "5": 0.3292666401750974, "2": 0.251844763284626, "3": 0.02011606358018685, "1": 4.7843513896762894e-05}, "score": 3.8053174497490994}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7192124033040956, "3": 0.125253399208025, "1": 0.09979140715728475, "4": 0.049331685325909404, "5": 0.00641082378952833}, "score": 2.1433578743855515}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9805032330528245, "4": 0.019260972127042843, "3": 0.00021324474805677125, "2": 1.5959568542276146e-05, "1": 6.059465276364205e-06}, "score": 4.9802404113170144}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5615968698022563, "5": 0.3507044265058221, "4": 0.08283948991052226, "3": 0.00484322963900633, "1": 1.5451553646998925e-05}, "score": 3.2226206885778894}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4960411956302473, "4": 0.20897889771201952, "3": 0.14594979299663663, "5": 0.12091312094453055, "1": 0.028116021640007254}, "score": 2.8985318021574304}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7073330634689673, "1": 0.28421738314689876, "3": 0.00832116508248778, "4": 0.0001239314460097327, "5": 4.395448430780847e-06}, "score": 1.7243648142469143}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9082834767871979, "1": 0.08245439717381436, "3": 0.008995829481402175, "4": 0.000248475328263075, "5": 1.7666912819466136e-05}, "score": 1.927091372451568}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9434054322373456, "4": 0.029563334050595563, "3": 0.02016982506667165, "2": 0.006850566016333531, "1": 9.286034064514205e-06}, "score": 4.909508032771461}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9998250801202664, "5": 0.0001318227949220487, "2": 2.2364246783626e-05, "4": 1.4444598781917701e-05, "3": 5.781895429833643e-06}, "score": 1.000604553319789}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5946524867178515, "4": 0.392069444713645, "3": 0.011568407357700561, "2": 0.001651159187260705, "1": 5.787419239229693e-05}, "score": 4.579608502304725}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4197267393690512, "2": 0.3210652196531837, "3": 0.22414390508139703, "1": 0.030090420912100034, "5": 0.004973193947049811}, "score": 3.048427091018084}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8138035835066486, "3": 0.16080712717369816, "1": 0.024744674124805525, "4": 0.0006103661103083747, "5": 3.401955675619044e-05}, "score": 2.137385275473515}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.607428977540636, "5": 0.33941874428375746, "3": 0.0530810122196736, "2": 6.99945623252572e-05, "1": 0}, "score": 4.286198106809877}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.976560821893352, "4": 0.015547298272282118, "3": 0.003464971054689937, "2": 0.003438786952062065, "5": 0.000986276319225556}, "score": 1.0609558416497078}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7507821719174246, "3": 0.22634511204720095, "4": 0.011893919212631231, "1": 0.01091726279373721, "5": 6.121030501639026e-05}, "score": 2.239399396093103}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5028579773217613, "2": 0.3725039042535003, "3": 0.1204021848111558, "4": 0.004170593196212906, "5": 6.313703721456092e-05}, "score": 1.6260739810922946}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.66845810804888, "1": 0.32341543684518637, "3": 0.008066458827544242, "4": 5.940013849694457e-05, "5": 4.771828911227554e-07}, "score": 1.6847712163093542}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.444945400432913, "4": 0.3425814292166964, "5": 0.11011007849267233, "3": 0.10235334350925043, "1": 8.23272905353036e-06}, "score": 3.11783989891146}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9784113031381065, "5": 0.021571277382615744, "3": 1.6437701328165083e-05, "1": 0, "2": 0}, "score": 4.021554860843374}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.6882769351628709, "4": 0.27937612130574635, "2": 0.02908726585685642, "5": 0.0017851466683200322, "1": 0.0014737192079552655}, "score": 3.2509119140594724}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9331010383002879, "1": 0.035964490583221015, "3": 0.029734285649695023, "4": 0.001189287369975881, "5": 1.0573295796647018e-05}, "score": 1.9961800884531042}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.76443840947825, "3": 0.23241595573832452, "4": 0.0026234225418796876, "1": 0.0005155106475084515, "5": 6.5158232052331625e-06}, "score": 2.2371668817028803}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7454851458944961, "3": 0.24333353615365158, "4": 0.007542717882824474, "1": 0.003600301813323121, "5": 3.799256785993331e-05}, "score": 2.2549327257393927}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8644083539039941, "3": 0.09296961124809379, "5": 0.02621138291924544, "2": 0.014752835166340917, "1": 0.0016535088058078507}, "score": 3.898775138848746}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8959879811430677, "3": 0.08834401715970236, "1": 0.014465236368045357, "4": 0.0011988845453802344, "5": 3.619372100760016e-06}, "score": 2.076287427941146}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"4": 0.625305380360023, "3": 0.24119122388760475, "5": 0.12261832461117385, "2": 0.010855129996479576, "1": 2.211509833775033e-05}, "score": 3.8596493970452688}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6099621944785868, "5": 0.38404290533223795, "3": 0.005265695728294444, "2": 0.0007182197336580412, "1": 8.370892904508156e-06}, "score": 4.377316643701105}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9782028513367199, "4": 0.02172103354725418, "3": 7.23970503807427e-05, "2": 2.3105198857182613e-06, "1": 0}, "score": 4.978127210005373}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5115535279971503, "5": 0.3996479677489922, "4": 0.08869955558454104, "2": 9.778992525327295e-05, "1": 0}, "score": 3.8878987300046544}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994955883583476, "4": 0.0005031450800145134, "3": 4.1813855000502597e-07, "2": 3.125076150208908e-07, "1": 0}, "score": 4.999495080849445}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.63990004148902, "2": 0.2378459223592533, "4": 0.12203391269089425, "1": 0.00012751583563745894, "5": 9.236023768673205e-05}, "score": 2.884117650467894}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7225954550543816, "5": 0.17281172014482596, "3": 0.09561678490653605, "2": 0.008801773884746069, "1": 0.00017276504637114931}, "score": 4.059073180996352}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5076360627798221, "3": 0.3089592771277308, "4": 0.17621909503218866, "1": 0.005739967676145815, "5": 0.0014435253464387906}, "score": 2.659989443078269}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5969444311932873, "4": 0.20618204228773432, "3": 0.19122552276668736, "1": 0.0036032592351454124, "5": 0.0020438467193211363}, "score": 2.606118432436784}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9813669816727127, "2": 0.018159961969531072, "5": 0.00038936825157551364, "4": 7.292040894772266e-05, "3": 1.0514019509449718e-05}, "score": 1.0199572293043995}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7172314049040937, "3": 0.14054385551735413, "4": 0.13757546170747073, "5": 0.003254055221451496, "1": 0.0013947204193937735}, "score": 2.4240624371542348}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9901119187506547, "2": 0.009884276665490497, "3": 3.518358543450425e-06, "5": 1.0272647125616169e-07, "4": 0}, "score": 1.0098917261035827}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5915738803394932, "5": 0.3911959475103512, "3": 0.01638244408745224, "2": 0.0006693473666031404, "1": 0.00017752306745492716}, "score": 4.37294255933355}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9568256892630858, "4": 0.03327228868714207, "1": 0.009157729520149526, "3": 0.0006001577623860503, "2": 0.00014302473079998295}, "score": 4.928467324111211}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9188644176420927, "3": 0.059030141065903256, "2": 0.01771801075469278, "5": 0.004370451312655267, "1": 1.6660731743687534e-05}, "score": 3.9098542778313625}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5281965028622885, "4": 0.4679275980752279, "3": 0.0038251163265352493, "2": 5.057323875176479e-05, "1": 1.073580851143828e-07}, "score": 4.524269971532463}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9203711098530019, "4": 0.07839263479344075, "3": 0.0011342030877325284, "2": 9.0918323357915e-05, "1": 1.087225963858718e-05}, "score": 4.919022693832097}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7077145673762378, "3": 0.19803335557021062, "5": 0.0908539506200091, "2": 0.0033884794433479528, "1": 9.364374645549076e-06}, "score": 3.8860155108253767}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7363860082554596, "4": 0.2561219194553854, "3": 0.007168465958866818, "2": 0.0003218451592404232, "1": 0}, "score": 4.728575135123545}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9565167227330821, "4": 0.04346000018052647, "3": 1.7087916186752293e-05, "2": 5.031980066104271e-06, "1": 0}, "score": 4.956490677698343}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9179151746252658, "5": 0.05427097637529624, "3": 0.027622530964202995, "2": 0.00017596208715906, "1": 0}, "score": 4.026296925050991}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5252867368794136, "2": 0.44170347194333953, "4": 0.03136221984912122, "1": 0.0015886161303533554, "5": 5.863961886386654e-05}, "score": 2.586598664422061}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5080983082241397, "5": 0.45519758570299373, "3": 0.016298878128670535, "1": 0.016217814182677082, "2": 0.004181906650336236}, "score": 4.381883554800814}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9999566555993957, "4": 1.601568505472545e-05, "3": 1.535578932980491e-05, "1": 9.43926916278868e-06, "5": 2.2926573461296936e-06}, "score": 2.0000448258731183}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8535266353747117, "5": 0.06823437560430054, "4": 0.05467226153010778, "2": 0.01859165230147982, "3": 0.004970686597623609}, "score": 1.4654893553470094}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"3": 0.972234017261392, "4": 0.015129840397223539, "2": 0.012592939238398068, "5": 4.134305942660144e-05, "1": 1.350217996042762e-06}, "score": 3.0026168881758424}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.8991342581531243, "4": 0.09871625056961418, "5": 0.0021403305484154625, "2": 7.2853214090300786e-06, "1": 0}, "score": 3.1029898194929095}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8591793409798714, "3": 0.11536096965626787, "5": 0.02452183828215961, "2": 0.0009347872450210586, "1": 2.2925587639833416e-06}, "score": 3.9072843449500207}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9329053259555032, "2": 0.030238153229159008, "3": 0.028477291465447644, "5": 0.008372924942753572, "1": 5.253111448790586e-06}, "score": 3.9194034829538706}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9978512196410116, "4": 0.0014618440387302572, "2": 0.0006145229390729478, "5": 7.058661645934417e-05, "1": 0}, "score": 3.0009884961383255}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6615266956536979, "2": 0.2162617066148998, "3": 0.11089179199876584, "5": 0.011312868453628522, "1": 6.840067212426156e-06}, "score": 3.467877091294802}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8525784078808808, "4": 0.14684825562877346, "3": 0.0005435064412757048, "2": 2.490362955139621e-05, "1": 2.39991797086676e-06}, "score": 4.851980046955497}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5274939620753917, "1": 0.3927710919665099, "2": 0.051221311157136594, "4": 0.026472696444141845, "3": 0.0020323886556721823}, "score": 3.2446992176099503}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9898398248739758, "1": 0.010098952231213976, "3": 3.941827565868386e-05, "4": 1.7313344420757128e-05, "5": 3.909293073224742e-06}, "score": 1.989986814785016}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9460048548184821, "1": 0.03624155827403962, "4": 0.01734096426310966, "2": 0.00033863964840774645, "3": 6.586739524288235e-05}, "score": 4.836543822359951}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4045075611802808, "1": 0.35741882699004696, "5": 0.1972804220940523, "3": 0.028789705605273525, "2": 0.01200117760810756}, "score": 3.0722297403796865}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9808745758054942, "3": 0.01109362122789703, "5": 0.005318189782392126, "2": 0.0027136038326009567, "1": 0}, "score": 3.98879736078453}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7446083079532535, "2": 0.09939259152886654, "4": 0.08055723124644716, "5": 0.06911182044211216, "3": 0.006324694790495194}, "score": 1.630164330541939}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7717129689276624, "2": 0.10042133442754166, "3": 0.06903574949041742, "5": 0.04317692370279504, "1": 0.01565176325956131}, "score": 3.7263428707180792}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5545823894005415, "4": 0.4248766276847363, "1": 0.010811974597970363, "3": 0.007511365541310723, "2": 0.0022136195450487986}, "score": 4.5102099136672535}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9022721058101486, "1": 0.07537438373160393, "3": 0.02198323855210852, "4": 0.00032988481826217727, "5": 4.0228655214140534e-05}, "score": 1.9473893020874185}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9998008899750327, "2": 0.00019861724049002698, "3": 4.142061666492614e-07, "5": 1.8415594575612853e-08, "4": 1.0011183688609445e-08}, "score": 1.0001995493587605}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6643461866052859, "4": 0.30814753529484956, "2": 0.024026752066005054, "5": 0.0034742939516166577, "1": 4.0361996072244675e-06}, "score": 3.2910616468084326}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.8856847095547437, "4": 0.05562752201099679, "1": 0.023547526403056598, "5": 0.01858355182462895, "3": 0.016555465334197134}, "score": 2.160013834423547}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7151785265302206, "2": 0.28434707269702747, "3": 0.00045767766950120467, "4": 1.3152259355399899e-05, "5": 3.022914880069101e-06}, "score": 1.2853141328055082}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5791620045161423, "2": 0.26241559277303367, "4": 0.15816744953037923, "1": 0.0002328716766744906, "5": 2.169944226113525e-05}, "score": 2.8953294722979392}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.42710891415466123, "5": 0.4100092904116079, "1": 0.12263887716463458, "2": 0.020533121781764332, "3": 0.01970102921867705}, "score": 3.981325222408706}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8429847173749073, "3": 0.11451418238887676, "2": 0.028948806559782676, "5": 0.013016506450247944, "1": 0.0005348249825549698}, "score": 3.8390000810729936}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9323339117981324, "2": 0.0645608944863164, "4": 0.0021120773283633217, "3": 0.00091973929783231, "5": 7.240052552256382e-05}, "score": 1.0730262784839837}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9507946788589801, "4": 0.049129186060284005, "3": 7.390108855576488e-05, "2": 1.484705680948857e-06, "1": 0}, "score": 4.950718520719614}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7410908400790053, "2": 0.2586383564941429, "3": 0.0002646704740260143, "4": 4.414848673648823e-06, "5": 1.64238352884994e-06}, "score": 1.2591875311481728}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4817843074520621, "3": 0.3491953399629223, "4": 0.14958439954436037, "1": 0.014510241043370562, "5": 0.0049249359968794515}, "score": 2.6486292093354398}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9960420100718906, "4": 0.003566413892341491, "1": 0.00033760249664309037, "3": 3.251952109074368e-05, "2": 1.8447512876615707e-05}, "score": 4.994962779395845}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9477806332778957, "4": 0.05205356471015761, "3": 0.00014041025889349347, "2": 2.0517692402579513e-05, "1": 2.736833398148741e-06}, "score": 4.947593002355592}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5014413437679739, "4": 0.4963391379688518, "3": 0.0019689251387143645, "2": 0.00021069077937013741, "1": 3.793070938348681e-05}, "score": 4.498938228666796}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7408271327785189, "2": 0.14840355396268579, "4": 0.10665360846405267, "5": 0.003856001551013991, "1": 0.00025941382277793054}, "score": 2.965443219956383}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.893310816386955, "4": 0.08809988952619355, "3": 0.017855476698005766, "5": 0.0007329504919768991, "1": 6.586161141660637e-07}, "score": 2.1962534894860344}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.84498128483035, "5": 0.06997538791312907, "4": 0.054002388603391044, "2": 0.02222302645389283, "3": 0.008812791794141298}, "score": 1.4817597943101708}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.4644174985308241, "5": 0.4529381939517991, "4": 0.06028064531434733, "2": 0.016263194995121633, "3": 0.006094221206577771}, "score": 3.0210589726955477}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9921172967458808, "1": 0.006310039768452406, "4": 0.0007211953602721672, "5": 0.000665704086982911, "3": 0.0001855446507555288}, "score": 1.997315007274742}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"3": 0.9987392508128708, "2": 0.0008631771635004476, "4": 0.00021794212763122682, "5": 0.0001784708991513205, "1": 8.608345596952158e-07}, "score": 2.999709985006842}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5737675958095448, "3": 0.34914324390466234, "4": 0.055941767240108096, "1": 0.020653949887940618, "5": 0.00048804204404129535}, "score": 2.441839341053581}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6064555152191926, "4": 0.22517592351489782, "2": 0.14080321524106415, "3": 0.027562817681006192, "1": 1.610609305405228e-06}, "score": 4.297281708053832}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.9142595374624541, "1": 0.06270995951614325, "3": 0.014158969058078067, "4": 0.008037798915508598, "5": 0.0008333996157826209}, "score": 1.9700247961656563}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6378916740140003, "2": 0.253249350630692, "4": 0.07632957508518302, "5": 0.021539397044688113, "3": 0.01098577527336043}, "score": 1.5903697106665582}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"2": 0.562320166511123, "4": 0.2194136758785491, "3": 0.16693641292522934, "5": 0.04887440180672992, "1": 0.0024544187683564153}, "score": 2.7499332443549807}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6047040585804059, "2": 0.1876973225517382, "5": 0.12868779523444562, "4": 0.04742899634878335, "3": 0.03147951066083208}, "score": 1.9076966166491154}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9098671583158794, "4": 0.05898894650505959, "5": 0.03049038167565928, "2": 0.0006500471235065745, "1": 2.3094018646764908e-06}, "score": 3.1193151819741867}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7968936715062832, "2": 0.18145503445870984, "3": 0.016705354202767038, "4": 0.0032892338949449323, "5": 0.0016520168569012985}, "score": 1.2313425967607186}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9972654410365457, "4": 0.0027242219896977545, "3": 5.737121237541641e-06, "2": 2.5746576091754895e-06, "1": 0}, "score": 4.997256574239028}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8579711283517775, "3": 0.14040121971491393, "1": 0.0010157345841771898, "4": 0.0006113848059863075, "5": 4.2959969659586125e-07}, "score": 2.140609558016632}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9808234402233219, "2": 0.019078782982130293, "3": 8.827434819303218e-05, "4": 8.364868030831699e-06, "5": 8.510601749528666e-07}, "score": 1.019283836048478}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9462187971925614, "3": 0.027360040663222476, "4": 0.024374799201971345, "1": 0.0016263012734419797, "5": 0.0004197284094575724}, "score": 2.075742548264008}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9992757945634348, "2": 0.0004716107475568434, "4": 0.00011103922951896287, "5": 7.551275315603642e-05, "3": 6.533537094202895e-05}, "score": 1.001237451065915}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9983769618533141, "4": 0.0008964428633207855, "3": 0.0007060863635344553, "5": 1.7873506952601083e-05, "1": 2.5207880174141162e-06}, "score": 2.002550072115318}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.871004330735678, "1": 0.10803862250501782, "3": 0.02037821990894799, "4": 0.0005741243198450314, "5": 4.615238555559069e-06}, "score": 1.9135016842086796}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9844954062381784, "3": 0.014158480582071824, "5": 0.0011721902167681302, "2": 0.00017286666209050905, "1": 8.041283027212426e-07}, "score": 3.986665560563027}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9319585309269853, "2": 0.06141178648223814, "5": 0.004787882653717341, "4": 0.0018413074298282322, "1": 2.1903594241057257e-07}, "score": 2.950004834510898}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5916125350396699, "3": 0.40799488149992086, "1": 0.0003853789970369518, "4": 5.445418200658588e-06, "5": 1.6824516716009272e-06}, "score": 2.4076254719157615}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9953307814523439, "3": 0.003235599666152352, "5": 0.0014311652591433425, "2": 2.350709172033077e-06, "1": 0}, "score": 3.9981908639884636}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.932202325882449, "1": 0.045198517109231985, "3": 0.022227333693777655, "4": 0.00036707161232277116, "5": 4.2299389399934585e-06}, "score": 1.9777756380301554}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.602986620938162, "2": 0.3954844934507806, "3": 0.0014417220670401687, "4": 8.517445440623621e-05, "5": 1.9609804111787165e-06}, "score": 1.3986313160749317}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9990981184398671, "4": 0.0008963517893525083, "3": 1.4644116503739077e-06, "1": 0, "2": 0}, "score": 4.999100715731433}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9944479379830949, "4": 0.0055453180602286194, "3": 4.884896304614244e-06, "2": 5.122423418313325e-07, "1": 0}, "score": 4.994443367936364}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.953996823694581, "1": 0.036818372708945515, "4": 0.009003562019515271, "3": 0.0001336170079432328, "2": 4.331766666706195e-05}, "score": 4.843325085345258}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5956472556899771, "2": 0.39330101060310035, "3": 0.010826413892466809, "4": 0.0002198722196776569, "5": 4.9650906640471206e-06}, "score": 1.4156335159546045}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8842383818240981, "3": 0.07838607360449815, "1": 0.03644457010270794, "4": 0.000919497714052188, "5": 1.134104627286099e-05}, "score": 2.0438145280147113}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9517855501629887, "1": 0.025037804908286224, "3": 0.02290675806385908, "4": 0.00026853722849881726, "5": 1.243916112005806e-06}, "score": 1.9984097591927859}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7620172010453053, "3": 0.2208765347204322, "5": 0.011602020674066163, "2": 0.005492515124748333, "1": 1.0347537388932713e-05}, "score": 3.7797091088927064}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5852196512500665, "3": 0.26235267305826204, "2": 0.11947494438654085, "5": 0.03212112068325301, "1": 0.0008312021762334465}, "score": 3.5283247596695118}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7809800918939928, "3": 0.18355344508949278, "4": 0.025050655102420046, "1": 0.009845010503547972, "5": 0.0005706846942718613}, "score": 2.22552182429358}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9869765003512809, "4": 0.012886216850856242, "1": 7.533279450305447e-05, "3": 5.637098399602464e-05, "2": 4.923115481091984e-06}, "score": 4.986684931923292}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9824220468646705, "4": 0.017188246014797265, "3": 0.000388981800806261, "2": 2.808584587586841e-07, "1": 0}, "score": 4.982032939822552}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.620488380835192, "4": 0.3113424646937719, "3": 0.03229719805627672, "2": 0.023168260937529394, "1": 0.012702429558435679}, "score": 4.503748009932623}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8482547038288638, "4": 0.14817862608046503, "3": 0.003355560696060992, "2": 0.00019324958847393383, "1": 1.7053586916950808e-05}, "score": 4.84446216401673}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8601063711495841, "2": 0.1394817375375477, "3": 0.0003980459926238093, "4": 7.96287056001028e-06, "5": 5.876730430154094e-06}, "score": 1.1403252258587515}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996032523251821, "4": 0.00033759621729505067, "1": 4.349841749311525e-05, "3": 8.199035766987578e-06, "2": 6.383232037056973e-06}, "score": 4.999452861759228}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5528475796245298, "5": 0.36961644727566184, "3": 0.05328315708005209, "2": 0.024082101277355585, "1": 0.0001691039404242119}, "score": 4.267662206970439}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8652973274121072, "4": 0.13106713580454923, "3": 0.003409978475079624, "2": 0.00022132706905916556, "1": 3.7115499214537967e-06}, "score": 4.861434007827167}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7973657476490918, "1": 0.11181624776211493, "5": 0.04494449926860157, "4": 0.03616872441575891, "3": 0.009703462484518468}, "score": 2.1050582998706804}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5862560320872238, "1": 0.17579948907866286, "3": 0.10112582959280488, "2": 0.07607302840492056, "5": 0.06074517644476534}, "score": 3.280074502877271}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8155071739206855, "4": 0.1840172087373397, "3": 0.00040063943489471193, "2": 4.6020850151744186e-05, "1": 2.8574181288926963e-05}, "score": 4.814929082258114}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7979859725060893, "1": 0.13090302461901981, "4": 0.06453846992694334, "3": 0.0037436788548273208, "2": 0.0028275264371750743}, "score": 4.395878692510553}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7089653253949887, "1": 0.1913479080030158, "5": 0.07156794505666952, "3": 0.01954171631983407, "2": 0.008573990661258746}, "score": 3.4608328441345315}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.534985090873824, "1": 0.4059710205027437, "4": 0.057328752057688226, "3": 0.0009446532774168545, "2": 0.0007674427301378005}, "score": 3.314590406600148}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9059136377992697, "1": 0.07361229614602871, "3": 0.020045183069569254, "4": 0.0004247473654590164, "5": 4.1085516013386235e-06}, "score": 1.9472947058826318}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7922494774408718, "3": 0.18138705599385888, "4": 0.016782620870540593, "1": 0.009335200723220161, "5": 0.0002456612508678725}, "score": 2.206354077405012}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9988009644182927, "4": 0.0007563676427926373, "3": 0.0004419913262269745, "1": 0, "2": 0}, "score": 4.998359648594871}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7284012828072631, "4": 0.2698858195453434, "3": 0.0017118065570911572, "2": 6.47104526404744e-07, "1": 0}, "score": 4.726688504680479}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6453879694458324, "4": 0.3457037446615419, "1": 0.004257280937793211, "3": 0.0034356058270306055, "2": 0.001212059863776401}, "score": 4.6267584939899615}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9600818027044983, "4": 0.03909376842547327, "1": 0.0004955653628389634, "3": 0.00022499261016732457, "2": 0.00010288836422421499}, "score": 4.958165278706177}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8772657419703689, "5": 0.11112265363685073, "4": 0.010132852611682104, "2": 0.0010475177093606587, "3": 0.0004167286364145247}, "score": 1.4767770632234936}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.517322607524454, "4": 0.48047172368177576, "3": 0.0021805583742522633, "2": 2.4271590664863414e-05, "1": 0}, "score": 4.515093938044529}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.768447779128008, "5": 0.22967739157794312, "3": 0.0013540989871003981, "2": 0.0002611966463603233, "1": 0.00025698290314745385}, "score": 4.227030529688492}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9415594019420024, "4": 0.05612287475035796, "2": 0.0015138427398537781, "1": 0.00042711126709652094, "3": 0.00037495970166312855}, "score": 4.936877118331263}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8997379632457054, "2": 0.10014236053594631, "3": 0.00011695152795402265, "4": 2.093370733479531e-06, "5": 6.200399038065793e-07}, "score": 1.1003850249959888}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8966184372091953, "3": 0.055582198491915195, "1": 0.039738034582058816, "4": 0.007746950476162176, "5": 0.00031417952492641884}, "score": 2.032280609883906}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.577164244769466, "5": 0.41861047725805844, "3": 0.00409863207986125, "2": 0.00012230128602442288, "1": 2.4458202762335416e-06}, "score": 4.4142606917378515}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992001010898376, "1": 0.0006234425114888149, "4": 0.00017533467181464178, "3": 3.1569414109881113e-07, "2": 0}, "score": 4.997330261742052}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9386832346290267, "2": 0.040487447142983364, "4": 0.014202512406357745, "3": 0.005859051198623464, "5": 0.0007669806385542883}, "score": 1.097881085071959}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8767954694005621, "5": 0.09986876548730493, "3": 0.022113101899302122, "2": 0.0012045012477534564, "1": 1.792496722378369e-05}, "score": 4.07529290403508}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7793493297959777, "4": 0.22026960624263175, "3": 0.0003787735594147419, "2": 1.9532517697811646e-06, "1": 0}, "score": 4.778966912361879}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.927431751960321, "5": 0.0418804980809559, "3": 0.030518872995519506, "2": 0.00016798447391573308, "1": 3.758386154214489e-07}, "score": 4.011024534317592}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6961535884027249, "4": 0.30358334297561784, "3": 0.00014663324803347957, "2": 0.00011479105445279663, "1": 0}, "score": 4.695778517127741}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9996709061132767, "4": 0.00026481237542626984, "5": 3.645798705207281e-05, "3": 2.7639600855433212e-05, "1": 1.23958872468298e-07}, "score": 2.000666514393959}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9060667773236892, "5": 0.06794229751485102, "3": 0.02577117138439338, "2": 0.00021640887496064183, "1": 0}, "score": 4.041738447991559}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8848352141605319, "5": 0.0915426403955622, "3": 0.02354330000139814, "2": 7.790285158851279e-05, "1": 7.328168718784055e-07}, "score": 4.067841350471726}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8613913570676962, "3": 0.12279502219033761, "5": 0.0133538773246629, "2": 0.002451261963241369, "1": 7.575546984506671e-06}, "score": 3.8856335009614678}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9839824524154696, "4": 0.015995284802798118, "3": 9.570950850653282e-06, "1": 0, "2": 0}, "score": 4.983985370040526}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9063334448284512, "4": 0.0929026786393984, "3": 0.0006369730569935907, "2": 0.00012381308606853735, "1": 1.5112703038064505e-06}, "score": 4.905445741594788}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8022992588536755, "5": 0.16432488576663978, "3": 0.01277950708532444, "1": 0.010579014545896968, "2": 0.010016946202368558}, "score": 4.099774481306098}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6695986004081439, "3": 0.15181752085938519, "5": 0.12406427511143328, "2": 0.052789445715649606, "1": 0.0017299599863800869}, "score": 3.8614779554454635}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9979308682106333, "4": 0.0020073201604336303, "1": 5.070500166821048e-05, "3": 7.233207373785239e-06, "2": 3.476272357220015e-06}, "score": 4.997764963713434}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9968510184754876, "4": 0.002160598526647153, "1": 0.0009777870029925102, "3": 5.120164451474821e-06, "2": 4.3061427851164685e-06}, "score": 4.993905087574981}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.957715744195048, "4": 0.042232023289299855, "3": 4.819563987617021e-05, "2": 1.6632849923611715e-06, "1": 0}, "score": 4.957666495093553}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7960159544975408, "1": 0.19165404139597617, "3": 0.012159725216825174, "4": 0.00016904391917976243, "5": 1.0473587909634997e-06}, "score": 1.8208468801243625}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6635490910027336, "4": 0.2848081452382154, "2": 0.04626303578159954, "1": 0.004199051552615521, "5": 0.0011802047955650336}, "score": 3.23250752559987}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8621021343607329, "4": 0.13668043077982492, "3": 0.0006494333789109185, "1": 0.0004956041671260414, "2": 7.013721642674814e-05}, "score": 4.859827557341254}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.742235144265996, "3": 0.22992277208200598, "5": 0.02691813112248993, "2": 0.0009204768564274433, "1": 1.3356386379668763e-06}, "score": 3.7951499600255736}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5155608199707641, "5": 0.48327997252633076, "3": 0.0011554677946415003, "2": 2.6168820660247688e-06, "1": 0}, "score": 4.4821198123043136}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9299134980595419, "2": 0.06985853572204306, "3": 0.00021429864037469338, "4": 1.1411214021151392e-05, "5": 2.209301844080125e-06}, "score": 1.0703302071621248}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4719356204741826, "3": 0.3458766051663816, "4": 0.16614406592273268, "1": 0.012836066179178986, "5": 0.0032071348837119464}, "score": 2.67495041793597}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5063839818856017, "5": 0.48743820770683793, "3": 0.006015735857283933, "2": 0.0001501200876246875, "1": 9.717375366282442e-06}, "score": 4.481094155797824}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7376215948393535, "2": 0.19446484067536599, "3": 0.037403144520790986, "4": 0.028088939281683132, "5": 0.0024196025205748864}, "score": 1.363217039824823}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3988618351020691, "3": 0.34285152405795455, "4": 0.24732755185633504, "5": 0.007649754677182879, "1": 0.0033083109726386186}, "score": 2.85714845797854}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4407711819420811, "3": 0.32748962624378786, "2": 0.15437562855451345, "5": 0.04451524785827374, "1": 0.03284358942417576}, "score": 3.30974033408151}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7698545100302457, "5": 0.15860746544302537, "3": 0.0673725037858497, "2": 0.004062581784336228, "1": 0.0001025833929925164}, "score": 4.082802077350926}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5536011153272392, "3": 0.2374124868102599, "2": 0.11001730581204984, "5": 0.09616896331777508, "1": 0.0027990757656136717}, "score": 3.6303242483301843}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8248105131982403, "5": 0.09724273535437897, "3": 0.07676850608126244, "2": 0.0011497345377419633, "1": 2.6383598759058266e-05}, "score": 4.018095647894954}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7023377115848611, "4": 0.29587393815031665, "3": 0.0017652529224935097, "2": 1.767859450921292e-05, "1": 0}, "score": 4.70054089752781}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7168417098854727, "4": 0.28309906205283236, "3": 5.874197558828537e-05, "2": 2.3689543398168137e-07, "1": 0}, "score": 4.716782672734572}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6250925376284787, "3": 0.23162794035364598, "2": 0.08972685211794174, "5": 0.05273783232807405, "1": 0.000814699356914917}, "score": 3.6392120398015115}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9625394467727548, "4": 0.037458778148380965, "3": 1.0453895153884743e-06, "1": 0, "2": 0}, "score": 4.962539103737771}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987451998209359, "4": 0.0012371453381897022, "1": 8.924145296342764e-06, "2": 4.878162236053747e-06, "3": 3.0945780311747675e-06}, "score": 4.998706333457314}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9894851070877291, "4": 0.010514237372892964, "3": 2.2565286818168106e-07, "1": 0, "2": 0}, "score": 4.989485306801245}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8842691405911786, "3": 0.0692017588343606, "1": 0.030199044324081114, "4": 0.015510066720963632, "5": 0.0008198333254604653}, "score": 2.072482359250619}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.43800791412079093, "3": 0.41039186805610395, "2": 0.1484940928972892, "5": 0.0029537580621628004, "1": 0.0001522543622342239}, "score": 3.295116861824424}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9462946964461831, "4": 0.05330834998227716, "2": 0.00020719690188152003, "3": 0.00018931845760227636, "1": 0}, "score": 4.945691398598191}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996383820995198, "4": 0.0002655349732416849, "1": 9.2800920410937e-05, "3": 2.2350677883516907e-06, "2": 4.42931369953935e-07}, "score": 4.99935746202733}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9939758981038183, "4": 0.006009795245402445, "3": 1.0180901446760061e-05, "2": 2.8297505360505794e-06, "1": 7.671879653173665e-07}, "score": 4.993958281753308}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4478945292792929, "3": 0.23995614536085103, "4": 0.199579365441582, "1": 0.09757997312592974, "5": 0.01498879585471281}, "score": 2.5865019891695136}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7321753533151591, "2": 0.2675958390471798, "3": 0.00022815735809095613, "4": 5.378839534275493e-07, "5": 3.6660461718555284e-08}, "score": 1.2680539343581751}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7515425284298407, "3": 0.20577325917626227, "4": 0.026559786309030532, "1": 0.015876704021926973, "5": 0.0002473641538438089}, "score": 2.2437583074772434}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5592570570032287, "5": 0.4371894735223134, "3": 0.003552152220144648, "2": 5.593759777420889e-07, "1": 0}, "score": 4.433636531193946}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5168347179884071, "4": 0.29809579035039074, "2": 0.17284872309513344, "3": 0.01201013142483093, "1": 0.00021010419156061925}, "score": 4.158496912269505}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"1": 0.888253680987576, "2": 0.11006647252731294, "3": 0.0015778402459364028, "4": 9.04787085118491e-05, "5": 1.1568577171391869e-05}, "score": 1.1135398587929919}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9997819442176188, "5": 0.00014521066614102255, "2": 3.8730738372707056e-05, "4": 1.9888099901571357e-05, "3": 1.4099333939912408e-05}, "score": 1.0007074364603261}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7801397879774093, "4": 0.08558926607648154, "3": 0.06004626083031088, "5": 0.03995825479317435, "2": 0.03426374434591069}, "score": 1.5709586169902239}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9999881244990143, "2": 5.606544398304257e-06, "5": 2.9197603995482633e-06, "3": 1.8810263485655018e-06, "4": 0}, "score": 1.0000210476695952}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6372818733184145, "4": 0.35652536200116053, "3": 0.003903609660239037, "1": 0.0020251196373418175, "2": 0.00025934093773455786}, "score": 4.626787165288622}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9793944054029923, "1": 0.0190680007939831, "3": 0.0015291814297251286, "4": 8.142445443771882e-06, "5": 3.803764183180423e-07}, "score": 1.9824786085910973}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.948989561410637, "2": 0.05096555839403613, "3": 4.465599469354157e-05, "4": 1.6701219554173388e-07, "5": 3.150624678943789e-08}, "score": 1.0510554987562142}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9262133141609415, "3": 0.07222604962681696, "4": 0.0010298878151526905, "1": 0.0005196202508526216, "5": 1.1136706650308715e-05}, "score": 2.0737996144944653}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6845432989060176, "3": 0.3096763063797101, "4": 0.00431774242555159, "1": 0.0014187411707696318, "5": 4.36445124783383e-05}, "score": 2.3170240681178305}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8159902031775229, "2": 0.10812665580974468, "4": 0.07540987834624142, "5": 0.00041215997299871507, "1": 6.067523095082342e-05}, "score": 2.9679861783358827}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9091375373815176, "3": 0.08030699909477175, "2": 0.0064109763689502094, "5": 0.004137059538075761, "1": 6.871981949219815e-06}, "score": 3.9109874423010873}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8274337709827988, "3": 0.08939046124307554, "5": 0.058659038889163656, "2": 0.024515536979473174, "1": 1.1582943764765462e-06}, "score": 3.920234026122989}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7776081849330784, "5": 0.21926292467070466, "4": 0.002880115158625018, "2": 0.0002452643376160671, "1": 0}, "score": 3.4411622490389484}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9679135398804477, "4": 0.03208238992017967, "3": 2.8664907830649074e-06, "1": 0, "2": 0}, "score": 4.967911838473459}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976990731996619, "4": 0.0022343198833003094, "1": 3.615295029873027e-05, "2": 2.399087519785699e-05, "3": 5.7414888484685805e-06}, "score": 4.997537610935348}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6454323994829134, "3": 0.3372122246841045, "4": 0.016646088751019552, "1": 0.000679770375438909, "5": 2.955235860113811e-05}, "score": 2.369913275698331}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9932147941699402, "1": 0.004673032782442949, "3": 0.002105040230824045, "4": 7.12217073852664e-06, "5": 4.2745325182465764e-08}, "score": 1.9974463801078033}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9280154385182477, "5": 0.0657647038649094, "4": 0.0058421172794240975, "3": 0.000351903347864692, "1": 2.4950916574215763e-05}, "score": 2.209305484044801}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5548702368779707, "3": 0.4433254626558048, "5": 0.0017810900757732429, "2": 2.2474358968350032e-05, "1": 0}, "score": 3.5584103536781493}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9971950238176186, "2": 0.0011402588282743778, "4": 0.0008623506357478209, "5": 0.0006617864745853345, "3": 0.00013986092807048023}, "score": 1.0066541832764586}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8468588374720862, "5": 0.11481249035653031, "3": 0.03500534902094689, "2": 0.003308591529304532, "1": 1.452176499246587e-05}, "score": 4.073146408332219}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9551891139760295, "4": 0.04014548894280218, "2": 0.002618271268945462, "3": 0.001505877190111945, "1": 0.0005393192833511976}, "score": 4.946830563154878}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9942869339856818, "4": 0.005685597819297569, "3": 1.9023909027751012e-05, "2": 7.574452397053263e-06, "1": 5.704541722318134e-07}, "score": 4.994251347467739}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.771092067074445, "1": 0.222361442875789, "4": 0.0060065147928435, "2": 0.00038702111720577274, "3": 0.00015085129616295454}, "score": 4.103083061684056}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9982326164649488, "4": 0.0008953274864221425, "3": 0.0006826781768465911, "5": 0.00018622498843578813, "1": 3.0651195023153448e-06}, "score": 2.0030289432613273}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9365578747704992, "3": 0.053920636927188174, "1": 0.008840307657973629, "4": 0.000677529136656568, "5": 3.709264310742558e-06}, "score": 2.0464465126528655}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7035277623656638, "2": 0.19719663516834976, "3": 0.05717891885581133, "4": 0.04016070696674488, "5": 0.0019309227143062219}, "score": 1.4397625071659748}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5463071858482678, "5": 0.30565547806347776, "3": 0.1478157667360833, "2": 0.00021676537728975394, "1": 0}, "score": 4.157406936751785}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6907624302814679, "5": 0.19519668260480355, "4": 0.0920158715467418, "2": 0.019967426662956166, "3": 0.002054353662438943}, "score": 2.0809139760651263}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8894106914576485, "2": 0.05264197361403867, "4": 0.028154386798535967, "5": 0.015510739872466603, "3": 0.014281942527279878}, "score": 1.2277120390639995}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9123674676550023, "1": 0.04356269997243347, "3": 0.03830035170268385, "4": 0.005517257344766739, "5": 0.0002521001824625839}, "score": 2.006528467771105}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8503759016674722, "4": 0.13278631459481366, "3": 0.011829187318649004, "5": 0.005006873052300433, "1": 1.6251133349987499e-06}, "score": 2.292420839283193}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6476846191168254, "3": 0.2568882277928858, "2": 0.07733955087268701, "5": 0.017904150885030393, "1": 0.00018329384179509103}, "score": 3.605786877736455}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984566927253736, "4": 0.0013183605788592465, "1": 0.0001958790854639103, "3": 1.818069938377991e-05, "2": 1.0434332363294154e-05}, "score": 4.997830457701539}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.9988113081545206, "2": 0.0011765557083548814, "4": 9.758986550203779e-06, "5": 2.314627015086624e-06, "1": 6.726633152445268e-08}, "score": 2.998837698005075}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5750789173713668, "3": 0.34760753799312943, "2": 0.06698058350658659, "5": 0.009605269738712823, "1": 0.000727452393171039}, "score": 3.5258540942334324}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9993340116687421, "4": 0.0006639389868392644, "3": 9.89337806443204e-07, "1": 1.6214943315589945e-07, "2": 0}, "score": 4.999333433141334}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982863111444528, "4": 0.001707278494450407, "3": 5.483527279088356e-06, "1": 2.5766874785572087e-07, "2": 0}, "score": 4.998280722625518}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6720876469197035, "4": 0.3190226422104558, "3": 0.004404989514324026, "2": 0.004283606431562735, "1": 0.00019925323590484534}, "score": 4.658518910791326}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.976030980263066, "4": 0.02392120918416278, "3": 4.5624897164177275e-05, "2": 6.237214265925568e-07, "1": 0}, "score": 4.975985632348367}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9988488958292653, "5": 0.0006760408870152558, "4": 0.0004555837473937484, "3": 1.902478414769388e-05, "1": 3.1291601659428724e-07}, "score": 2.0029580024435165}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.38122617683617144, "3": 0.3644950528695056, "2": 0.23301044455611875, "5": 0.0127062281527352, "1": 0.008561070827344714}, "score": 3.156506207624854}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9999629731405111, "4": 3.625856241513665e-05, "3": 1.3923732299793586e-07, "2": 9.29924062828048e-08, "1": 0}, "score": 4.999963183965983}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5443538140859829, "4": 0.4549530464370347, "3": 0.0006920834618565972, "1": 0, "2": 0}, "score": 4.543662304739743}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9804807709615515, "4": 0.01932920527811478, "3": 0.00018648812384934276, "1": 0, "2": 0}, "score": 4.980297748814189}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9932343203688007, "2": 0.006764212040828916, "3": 1.4458415765723076e-06, "4": 2.8627100438495134e-08, "5": 1.3228754570806622e-08}, "score": 1.0067672423842324}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9436279748035898, "3": 0.04729460732623778, "4": 0.008778875102389632, "1": 0.0002866091835477514, "5": 1.176390044489525e-05}, "score": 2.0646010510105555}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.846325086655444, "4": 0.08789312422911394, "3": 0.06577381290718129, "2": 3.823057740160772e-06, "1": 0}, "score": 4.7805468693614195}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9107458315919115, "4": 0.08924386501614015, "3": 9.400008165673719e-06, "2": 1.693564790624896e-07, "1": 0}, "score": 4.910736761376438}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7870243899523728, "5": 0.20390579112804993, "2": 0.007781140170899222, "3": 0.0012882722492434703, "1": 0}, "score": 4.187055314574888}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9596378646597543, "4": 0.04029601896083544, "3": 6.507923698139541e-05, "2": 2.9387686025996307e-07, "1": 0}, "score": 4.959572910886558}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9570246741985082, "4": 0.04276372852775759, "3": 0.00018455722130378816, "1": 1.6990911066971087e-05, "2": 9.124339907649768e-06}, "score": 4.956771780388123}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9689203728783783, "3": 0.020917266766877187, "2": 0.007136750630391157, "5": 0.003016782237194611, "1": 6.7011058027449415e-06}, "score": 3.9678058424350704}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8723377256474926, "2": 0.11631314490571042, "4": 0.006918201790398755, "1": 0.004308359817841609, "3": 0.00011946322195850632}, "score": 4.626668838727067}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9254983220409464, "4": 0.0743043189808249, "3": 0.00018800133388998516, "2": 6.101572702090751e-06, "1": 2.0652774132856496e-06}, "score": 4.925293023563}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8834416089606123, "2": 0.11509243394925643, "3": 0.0013706813870167905, "4": 8.132329915460129e-05, "5": 1.3637871037851701e-05}, "score": 1.1181323552614204}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9122083281544954, "1": 0.06332335883321982, "3": 0.023997730874496744, "4": 0.0004636632609125539, "5": 6.889569202016092e-06}, "score": 1.9616223661459489}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9893112342112593, "4": 0.0056950380545897775, "2": 0.004722586226971896, "5": 0.00027044467750086173, "1": 1.5905941902127618e-07}, "score": 3.0015130238774415}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.9953429475543722, "2": 0.0034612918241947324, "4": 0.0011557382057423111, "5": 3.996961569993195e-05, "1": 0}, "score": 2.9977743854954353}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.522267484463043, "1": 0.46975504546554797, "3": 0.007521693251076308, "4": 0.000402144934797498, "5": 5.3654887141396685e-05}, "score": 1.5387319129264545}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8916261933373745, "3": 0.09819789497021478, "1": 0.007552085716735705, "4": 0.0025817391964645005, "5": 4.1856456322021504e-05}, "score": 2.0959348791113723}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9784761269910933, "4": 0.02150779180431411, "3": 1.5602537448201402e-05, "1": 0, "2": 0}, "score": 4.978460992810774}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6265820797870272, "4": 0.3724617429227433, "3": 0.0009535544777990664, "2": 1.9186533465753695e-06, "1": 0}, "score": 4.625625128542153}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9816015888047491, "4": 0.018381822688932774, "3": 1.5153424681053687e-05, "2": 1.2249287156021445e-07, "1": 0}, "score": 4.9815874788150225}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9846818252923647, "4": 0.01529239856285265, "3": 2.2133572156608367e-05, "1": 2.4022806523987644e-06, "2": 0}, "score": 4.984653706136339}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9969316953976234, "3": 0.002294679033349245, "5": 0.00039531509587088006, "2": 0.0003750457647900262, "1": 3.2114243387495444e-06}, "score": 3.9973409101182384}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6561204461209752, "1": 0.3318720420066391, "3": 0.011559426820140658, "4": 0.00043087824584842706, "5": 1.7136412027373625e-05}, "score": 1.6806005280573562}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8949682018479034, "4": 0.10347251056086251, "2": 0.0009091454187127504, "3": 0.0006300613892953728, "1": 1.9494055208046356e-05}, "score": 4.892461891087954}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7649375901399189, "2": 0.214912007944677, "3": 0.019585910956048114, "4": 0.0004923168720009291, "5": 7.159079884549392e-05}, "score": 1.2558472929009443}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4081186655212161, "2": 0.36639873452332944, "3": 0.1446955209307023, "5": 0.046478446034038064, "1": 0.03430624058863306}, "score": 3.0660644999415436}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5690257449053615, "5": 0.21852160294942277, "3": 0.08548146586901485, "2": 0.06901221921437957, "1": 0.05795416728776137}, "score": 3.821152338359998}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8070081593859845, "4": 0.18932381936962084, "3": 0.003345883147733433, "2": 0.00023653331337867588, "1": 8.043710365387678e-05}, "score": 4.802952047699471}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962201493877613, "1": 0.0027530097809354247, "4": 0.0009667106806378761, "3": 4.576659956630463e-05, "2": 8.444197828165266e-06}, "score": 4.987904312804358}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9994697456345629, "5": 0.00038634863370835744, "2": 9.747077192794588e-05, "4": 3.5526701119156756e-05, "3": 9.262866499756579e-06}, "score": 1.0017679740521293}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9968492396961173, "1": 0.0027219016688534215, "4": 0.00040804789530353143, "3": 1.1355004342229505e-05, "2": 0}, "score": 4.988681528396126}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8935733454061167, "3": 0.05529652010559302, "1": 0.04511294702257411, "4": 0.005576145008686849, "5": 0.0004409998599902079}, "score": 2.0226588636455634}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8216942350099958, "1": 0.17678363416556975, "3": 0.0015142878750509618, "4": 7.530869886870139e-06, "5": 2.601618238806979e-07}, "score": 1.8247464868359724}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6903517007621452, "5": 0.21495860591903732, "3": 0.09076194401565764, "2": 0.0038958924453990264, "1": 3.0246048806065514e-05}, "score": 4.1163143262263215}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8612614432070097, "5": 0.09850027883459792, "2": 0.022983516359790096, "3": 0.017253166278010587, "1": 0}, "score": 4.035280136120135}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5619048216081597, "5": 0.4359507241607705, "3": 0.0021374195399296867, "2": 3.713439581241432e-06, "1": 0}, "score": 4.43380731852491}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.802016137297079, "2": 0.08592105237364323, "4": 0.04972207398078123, "5": 0.042662216924556635, "3": 0.019677907878417476}, "score": 1.445092229965209}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5511646688170069, "2": 0.28195657761184967, "4": 0.06256956507568119, "3": 0.05753074375879966, "5": 0.04677787239228962}, "score": 1.7718386916831832}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9988848142822757, "4": 0.0011040699197784915, "3": 1.0323961554609615e-05, "1": 0, "2": 0}, "score": 4.9988752812665185}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999961110815618, "4": 3.1867435286203833e-06, "1": 0, "2": 0, "3": 0}, "score": 4.999996813254234}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7858214619509232, "4": 0.20762668406331153, "3": 0.006549719858135066, "2": 3.980110771556124e-07, "1": 0}, "score": 4.779272298978171}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9979806137096249, "2": 0.002018123822326999, "3": 1.0297875902993067e-06, "5": 7.963166672725697e-08, "4": 2.1420402098446297e-08}, "score": 1.0020205664513446}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7166516501694435, "2": 0.27823783763178644, "3": 0.004086977825632943, "4": 0.000987237420340743, "5": 3.6232972904231836e-05}, "score": 1.289518455959051}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5631245780052836, "3": 0.32864563696113547, "2": 0.08144655831614758, "5": 0.026219795501750888, "1": 0.000563269702070268}, "score": 3.532991157373825}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8981191515627259, "4": 0.08286158614888378, "2": 0.01542790339998104, "3": 0.0023293628587019604, "1": 0.0012597959696246126}, "score": 4.861156488591204}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5193878668296796, "4": 0.4702025874594934, "3": 0.009229442806032818, "2": 0.0011717503763209998, "1": 7.804726860975056e-06}, "score": 4.507791787259581}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8109580520018055, "2": 0.18891292204722365, "3": 0.00011737765510368717, "4": 1.0620150116295838e-06, "5": 0}, "score": 1.1891528658278283}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9121838311287781, "2": 0.08555924662766111, "3": 0.0021773581388361417, "4": 7.563563676997218e-05, "5": 3.7701906028394862e-06}, "score": 1.090155964847702}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9985510560344005, "2": 0.0008296253870186473, "4": 0.0003170490703531337, "3": 0.00026962835772977435, "5": 3.230773121097163e-05}, "score": 1.0024492610550124}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9485205196982609, "3": 0.045234418982974436, "5": 0.0047093894867634295, "1": 0.0008564125046007176, "2": 0.0006776368723540573}, "score": 3.9555503871277806}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9233011857059035, "3": 0.05106239309371722, "1": 0.021587718801416713, "4": 0.0036993224415743896, "5": 0.00034781542737428116}, "score": 2.0379168247795825}]