[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3284757382333648, "2": 0.26467823454748346, "1": 0.2617558447415968, "4": 0.11291139306842939, "5": 0.031926579594329846}, "score": 2.3884203818441843}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3450856610057624, "3": 0.3131086888490052, "5": 0.21645136474193064, "2": 0.07531913948846632, "1": 0.049942976219559385}, "score": 3.6028388620362537}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4569404970302669, "3": 0.28239643426023703, "5": 0.19188575693694718, "2": 0.04803640106306249, "1": 0.02064940445381366}, "score": 3.751445562903275}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.38645715921845, "5": 0.32068443753877546, "3": 0.21335110288327372, "2": 0.0448534845532649, "1": 0.03458117915408311}, "score": 3.9138765723692672}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7505295912287759, "4": 0.21452236077714734, "3": 0.031223583134400545, "2": 0.0022388738165731938, "1": 0.0014769685039502055}, "score": 4.710403480431203}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5930041391452017, "4": 0.25953663785576125, "3": 0.09474240467255092, "1": 0.026420852848404702, "2": 0.02612694034176579}, "score": 4.366807294896927}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4806090813494956, "4": 0.3293505150693643, "3": 0.15269465051758335, "2": 0.02414929721826378, "1": 0.013030672206964045}, "score": 4.240563701300143}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3536579768425843, "4": 0.26279374342975526, "5": 0.15676335558571886, "2": 0.1416041627786963, "1": 0.08496765706669161}, "score": 3.2648374156802826}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5789121731776641, "4": 0.30228968485256175, "3": 0.09217256060817787, "2": 0.015472778884280442, "1": 0.011028196143773716}, "score": 4.422762145210479}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.46159153608225323, "4": 0.3293520959556308, "3": 0.15018561748439418, "2": 0.03476368053445417, "1": 0.02393256967104959}, "score": 4.1701105328500905}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3395620771330294, "2": 0.26573954606836214, "1": 0.2120892292864639, "4": 0.11666414822997451, "5": 0.06588200104794675}, "score": 2.5584823308510436}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.302007870707956, "1": 0.2448646916449096, "2": 0.23479919957478465, "4": 0.1349804939827389, "5": 0.0831428970768809}, "score": 2.5766509834905222}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5471226930364771, "4": 0.29267500018040515, "3": 0.13199925504634324, "2": 0.0163104218203703, "1": 0.011829261842763861}, "score": 4.347036799874592}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.43741306565658344, "4": 0.35376805233183556, "3": 0.16130614465519813, "2": 0.029538180447543888, "1": 0.017906186702720064}, "score": 4.163323166436692}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2808418723196459, "4": 0.2499060079534122, "5": 0.1722902542033699, "1": 0.1505039875192016, "2": 0.14639078842921194}, "score": 3.1470976216094773}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.62583302292756, "4": 0.249307900056409, "3": 0.09967926475734924, "1": 0.013664118083922684, "2": 0.011449944455977346}, "score": 4.462291910569602}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3802152269072613, "2": 0.23230344717307777, "1": 0.17131921642436646, "4": 0.16490825335533077, "5": 0.05103515857245623}, "score": 2.691969324919075}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.39985970535864934, "4": 0.2603694226712707, "2": 0.1465138230040083, "5": 0.09880699274120752, "1": 0.09431808746945548}, "score": 3.122849622522553}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3588509348435259, "5": 0.35405716352517475, "3": 0.1982670340678784, "2": 0.05058637539066676, "1": 0.03815358707937946}, "score": 3.9401515359984005}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3275299754512012, "4": 0.2632299484762821, "2": 0.1586247070115813, "5": 0.12634199536801025, "1": 0.12415498683667395}, "score": 3.108992161766761}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3257715533028247, "4": 0.2852501968910143, "2": 0.1859592342480043, "1": 0.10304785366043863, "5": 0.09986845589461181}, "score": 3.092941712783198}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.602256888266032, "4": 0.2732214337319401, "3": 0.10712614646476146, "2": 0.011842772654986379, "1": 0.005325487618658545}, "score": 4.455572272121278}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3764591413281344, "4": 0.2910660388291093, "5": 0.1869624844814947, "2": 0.10000070930192011, "1": 0.04538155654392373}, "score": 3.4742888759265913}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4283287803116622, "5": 0.36854590592861747, "3": 0.1625824046838895, "2": 0.027458450713224735, "1": 0.01293058297768696}, "score": 4.112272126801945}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3912705948182629, "5": 0.3761291163465335, "3": 0.18346040707996075, "2": 0.03397575149946515, "1": 0.01500132122638346}, "score": 4.079726222737433}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4306310663493498, "3": 0.25685578485852995, "5": 0.2175250636326082, "2": 0.06356899039142723, "1": 0.03114635671434611}, "score": 3.7400213217694707}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.456010086588849, "5": 0.411102624914071, "3": 0.11346940929705579, "2": 0.013373782745820195, "1": 0.0059809210568218165}, "score": 4.252958867731899}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.680611241505412, "4": 0.26775764963420634, "3": 0.04701496141260018, "2": 0.002966778485146643, "1": 0.001585599039742776}, "score": 4.622945651199434}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7578076010734499, "4": 0.20851577106591046, "3": 0.029762888914163003, "2": 0.0025294762841067383, "1": 0.0013355565267869937}, "score": 4.719014110409461}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8454957899645626, "4": 0.13686154289412936, "3": 0.015760507394313502, "2": 0.000966031032042627, "1": 0.0008446870958116436}, "score": 4.825328121996087}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"2": 0.323532955019276, "3": 0.29147151402729277, "1": 0.22548018393961566, "4": 0.1248285104523401, "5": 0.03463415309827911}, "score": 2.4195729148414116}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4105780517161675, "4": 0.21628558322527475, "2": 0.17522926092729546, "5": 0.11254764903844246, "1": 0.08527914025952303}, "score": 3.095601018035645}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5231359531690659, "4": 0.3590050585229335, "3": 0.09397791228638484, "2": 0.015551680118308351, "1": 0.008251766337804112}, "score": 4.373328362951258}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.3736351845502999, "4": 0.34209154578667844, "3": 0.1989952149548015, "2": 0.05493508849097846, "1": 0.03019803871264864}, "score": 3.9741719332783374}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2601737765190676, "1": 0.20242769862864915, "4": 0.20045894826639968, "2": 0.1706687731518992, "5": 0.16621736823584782}, "score": 2.957367236238719}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3743061138929897, "5": 0.3461435865430971, "3": 0.1891543936088981, "2": 0.049830292337961615, "1": 0.040399009970338184}, "score": 3.936120935862227}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.313618876310727, "3": 0.2526789672867301, "5": 0.23992027459852586, "2": 0.09754488967597602, "1": 0.09595587774392596}, "score": 3.504144502615308}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5700044335647609, "4": 0.31635913739214605, "3": 0.08977949235194857, "2": 0.01254729718930956, "1": 0.011219297413117339}, "score": 4.421510534736966}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6059955719213487, "4": 0.2910528247309088, "3": 0.08101335997074724, "2": 0.012153634720288322, "1": 0.009656712592617403}, "score": 4.471765141636963}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4247632602351639, "4": 0.37534664249542576, "3": 0.14277234647007483, "2": 0.030126011830528127, "1": 0.026844862959513424}, "score": 4.141225043796338}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5014538498710379, "4": 0.2995122981497646, "3": 0.12445799619034985, "1": 0.042230735232232496, "2": 0.0322399052578604}, "score": 4.185843391036179}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7901729132022867, "4": 0.1692161816759835, "3": 0.0353395127386405, "2": 0.002997250231916757, "1": 0.0022138940508913962}, "score": 4.742241936513762}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3924778172175438, "4": 0.28180503849309035, "3": 0.21345812529499636, "2": 0.06790581550497655, "1": 0.04426020555981701}, "score": 3.9104191133961597}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8883964756903111, "4": 0.0920117493280349, "3": 0.015605123330850209, "1": 0.002290824230938176, "2": 0.001616734831136704}, "score": 4.862753647423783}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.47161802033068234, "4": 0.2762938792084763, "3": 0.15152338644080535, "1": 0.054019077919836095, "2": 0.04631420321638355}, "score": 4.065424134993834}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.37592414423543724, "2": 0.2735013284255738, "1": 0.17600031397442145, "4": 0.14411929281963054, "5": 0.030391965447257967}, "score": 2.5793747868383488}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.36458400051357703, "3": 0.273646842478195, "5": 0.2525173297370129, "2": 0.06757168801550231, "1": 0.041542299740246286}, "score": 3.7190614875786467}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.38344982544258277, "4": 0.2544848431927034, "5": 0.21770731718142128, "2": 0.08940075961738572, "1": 0.054894462541904304}, "score": 3.4907406074503533}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.796006967528146, "4": 0.1658257567558078, "3": 0.030202861724538305, "1": 0.004732200323361997, "2": 0.0031300133789947293}, "score": 4.745423660589184}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.33134842955313365, "5": 0.2624398410940611, "3": 0.2565335817343596, "2": 0.09192128187393336, "1": 0.05767272043619504}, "score": 3.6490160006464096}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30989055259100257, "4": 0.26665771747878686, "2": 0.19270447137823776, "1": 0.1408598154263149, "5": 0.08966737396446349}, "score": 2.9715621048731196}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5004220182792491, "4": 0.38603073049688397, "3": 0.09452244116775087, "2": 0.01114372633463191, "1": 0.007806836147185469}, "score": 4.360218361340226}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.48025301469886156, "5": 0.3499166834927403, "3": 0.14875417019871875, "2": 0.013208726094945198, "1": 0.0077908680031401134}, "score": 4.151384043652707}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.401633981056373, "5": 0.3183531429319707, "3": 0.20167634883899688, "2": 0.043583135670517165, "1": 0.034691017056345565}, "score": 3.925432820496406}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3097065012915602, "3": 0.23347170195225855, "2": 0.1936881669513041, "4": 0.1909014600565915, "5": 0.07214581497132692}, "score": 2.5220506472550674}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.35373755884001296, "3": 0.33712503287718776, "5": 0.14906399031934076, "2": 0.10317940601153978, "1": 0.056722784836491465}, "score": 3.4353151015433117}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.39043354634383, "3": 0.2856407433222899, "5": 0.2187236539682627, "2": 0.07106392179515833, "1": 0.033857707832692346}, "score": 3.689294813515726}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3675488661695568, "4": 0.3208766813222883, "2": 0.13460590392392252, "5": 0.11244470379458765, "1": 0.06428057454446007}, "score": 3.28266780056377}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.38627143004195486, "3": 0.2700010853977975, "5": 0.22752421652327018, "2": 0.07436644849093457, "1": 0.04155015613192559}, "score": 3.6840491942111457}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3204950010791478, "4": 0.21995330613451794, "2": 0.20143359605952335, "1": 0.15461750833266272, "5": 0.10331997011515899}, "score": 2.9159094453487264}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"5": 0.47105735008011146, "4": 0.37264414111398275, "3": 0.11921945793058665, "2": 0.019649358254583478, "1": 0.017329292521604017}, "score": 4.26057746007837}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6021182345806269, "4": 0.28115465145265717, "3": 0.08916311802113105, "2": 0.01378234849670745, "1": 0.013669434459825406}, "score": 4.444431987228322}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4876631392060475, "4": 0.31165885588722864, "3": 0.16865536610243814, "2": 0.020474153360755212, "1": 0.011454197755137056}, "score": 4.2437198528982325}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9500390708715895, "4": 0.04520636877355116, "3": 0.003919803711619277, "1": 0.00042533545265877314, "2": 0.000274822533868748}, "score": 4.944420733496356}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.39840992557108157, "4": 0.36125185666919385, "3": 0.15338933754409143, "2": 0.043622919069929864, "1": 0.043106145716825445}, "score": 4.0284625692485205}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.563451093422991, "2": 0.23613282841978214, "3": 0.125370929478347, "4": 0.053823236492149484, "5": 0.021136581907499286}, "score": 1.7329532675899086}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.39799528121965805, "5": 0.31217264339386636, "3": 0.19381947391038457, "2": 0.05739365625326545, "1": 0.03849349550052645}, "score": 3.888071329054684}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4287501631402581, "5": 0.2569606290963424, "3": 0.23328177997094565, "2": 0.05311398045409002, "1": 0.027694323903983985}, "score": 3.834334928707312}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5166547099691128, "4": 0.32092061234697133, "3": 0.11817319220846534, "2": 0.023882514468503178, "1": 0.020265892062679963}, "score": 4.2899487002415135}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.43081625598461576, "5": 0.354469667799765, "3": 0.16021416941112301, "2": 0.03439943978689745, "1": 0.01998290142176584}, "score": 4.065515616932091}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7274341132625242, "2": 0.21643017519056784, "3": 0.04254509954182828, "4": 0.007156036591123566, "5": 0.0063613255724884145}, "score": 1.3484593109268321}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.275906289973378, "4": 0.2720285105447373, "2": 0.18584198673685332, "5": 0.14490487301902052, "1": 0.12119663133486272}, "score": 3.1336192697625487}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.45348200068232386, "2": 0.3020133068985543, "3": 0.17002593410638783, "4": 0.05149434413318489, "5": 0.022824645131096388}, "score": 1.8879886611386971}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7846244133709765, "4": 0.16033706874981205, "3": 0.045179628077163046, "2": 0.006096755710642344, "1": 0.0037044417735250653}, "score": 4.716179266593862}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.5136251806822963, "2": 0.2674556288132364, "3": 0.12746331261322047, "4": 0.06986757600145897, "5": 0.021437186029874235}, "score": 1.817857317375353}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"1": 0.38287852776110615, "2": 0.2972894011401159, "3": 0.19666128412125317, "4": 0.09370465604410604, "5": 0.029245808930436133}, "score": 2.0889490926819305}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.44729627335495775, "5": 0.2740135558260925, "3": 0.22670510567443725, "2": 0.03633149801665559, "1": 0.015475718991569801}, "score": 3.9282055286307056}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.32050945572964634, "3": 0.2921942377750869, "5": 0.2700778036034641, "2": 0.08024825995586872, "1": 0.036826834543221554}, "score": 3.7068645041966755}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.30912792221588664, "3": 0.2861508098419944, "5": 0.1770202050674165, "2": 0.1431018019866093, "1": 0.08449473958405256}, "score": 3.3511137500630284}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2973144636930038, "3": 0.27227796618555766, "1": 0.23773613424343684, "4": 0.13970082600931716, "5": 0.05292260053869079}, "score": 2.4727339812185303}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9510284870960015, "2": 0.039219586553329834, "3": 0.0069906949994763675, "5": 0.0013977283043732777, "4": 0.0012731122318720178}, "score": 1.062616886456788}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2583649134901454, "3": 0.24006907129098518, "5": 0.19863780261321534, "1": 0.15841921502229067, "2": 0.14443367114948477}, "score": 3.1943830597052036}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4537362939636534, "2": 0.2538064779982004, "3": 0.15967518834227984, "4": 0.08768641453363084, "5": 0.04504713017790903}, "score": 2.0164539119118157}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6509307156567362, "4": 0.2214215562671909, "3": 0.07922301729283351, "1": 0.027867718585180817, "2": 0.020384258870134928}, "score": 4.447413308057749}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4887450722921934, "4": 0.26114773429849897, "3": 0.1353687828646217, "1": 0.06344147193010329, "2": 0.051164947527424405}, "score": 4.060729994400397}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8367265955016205, "2": 0.12738490856045004, "3": 0.02479625860236504, "4": 0.0078502884707246, "5": 0.0032082056040294085}, "score": 1.2133683133361173}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4924268782259762, "4": 0.34580736760093883, "3": 0.13377784874016396, "2": 0.01908221174749752, "1": 0.008809546640555225}, "score": 4.294084241399905}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6842169454071504, "4": 0.25355969511106174, "3": 0.0510307697375416, "2": 0.0058927682512906485, "1": 0.0052477083627857565}, "score": 4.605689078432457}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7315269625057084, "4": 0.21040586984602813, "3": 0.04630660367919481, "2": 0.006024583082048253, "1": 0.0056754087033295915}, "score": 4.656184713093404}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.35495814424255107, "4": 0.324549601291433, "3": 0.20934524498633242, "2": 0.060504429605845636, "1": 0.05049244287189536}, "score": 3.873107660193373}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"2": 0.34954184370389896, "1": 0.26440824174206884, "3": 0.2639003788215593, "4": 0.1032892989693887, "5": 0.018745660375380484}, "score": 2.2623377738588966}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3481941682726865, "3": 0.2927914494557021, "5": 0.1824273987823791, "2": 0.11677199572080663, "1": 0.05970606335532745}, "score": 3.4769167912875707}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.32187905808528766, "5": 0.27302675088718475, "3": 0.21168492767468175, "2": 0.10161367057354105, "1": 0.09158693028136687}, "score": 3.5832667346171916}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.39197424612917076, "4": 0.3667467586628037, "3": 0.17130880053265418, "2": 0.03899353171769974, "1": 0.030928428557301005}, "score": 4.04989550316889}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30908644003224206, "4": 0.2846324728131196, "2": 0.18069166655824542, "1": 0.12107116085650474, "5": 0.10443737181626134}, "score": 3.0706789452475123}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7440018184491118, "2": 0.2012727551514022, "3": 0.04268417655111334, "4": 0.008251959431395601, "5": 0.00369833337499761}, "score": 1.326219992053318}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.475110438436648, "2": 0.22689598100044378, "3": 0.18219854134111296, "4": 0.060649766109310506, "5": 0.05499394448961254}, "score": 1.9933684650508723}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.5517981554454643, "2": 0.2944253760559037, "3": 0.12290647238063125, "4": 0.022632824837882846, "5": 0.008165608744341463}, "score": 1.6408450908079186}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.43465166013018314, "2": 0.2554084118355192, "3": 0.1894890764849538, "4": 0.0951031487589949, "5": 0.025238065208802538}, "score": 2.0207601855957087}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.4625711712892114, "2": 0.31640966398082826, "3": 0.1640478869798914, "4": 0.05000458888826562, "5": 0.00682096719318037}, "score": 1.8219228453466327}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"1": 0.31952495557463984, "2": 0.2662068076252691, "3": 0.22720417873153176, "4": 0.13901912018827206, "5": 0.04785011776297478}, "score": 2.3293319773168157}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4760693557536032, "4": 0.2921665975075986, "3": 0.17505896831806358, "2": 0.031473268892759795, "1": 0.025094589847540955}, "score": 4.162802419803417}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5105882125136917, "4": 0.2861355584102841, "3": 0.16017170226408117, "2": 0.022986366492523287, "1": 0.019965719520957843}, "score": 4.244583903267195}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9157199797558072, "4": 0.07144223913713833, "3": 0.010970806376139978, "2": 0.0008999377173311391, "1": 0.0006973492476710327}, "score": 4.90110026591957}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.32931596801235835, "3": 0.29885385629917377, "2": 0.14420678536537027, "5": 0.12699773847062645, "1": 0.1005027689621865}, "score": 3.2381283835679}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"4": 0.38056068381293706, "3": 0.2508376906038383, "5": 0.21467891193442626, "2": 0.09293899210139903, "1": 0.06093645981940719}, "score": 3.595134723036975}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5578283111818076, "4": 0.36825430252534264, "3": 0.06476758708958996, "2": 0.0061401445177944845, "1": 0.0029561663562299918}, "score": 4.471937179119154}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.43447796023221824, "4": 0.3616881147419872, "3": 0.16730181872640537, "2": 0.02484737912024075, "1": 0.011574822660897394}, "score": 4.182777003301133}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6670125284230252, "4": 0.26977513508510076, "3": 0.054609888749608385, "2": 0.005329214633354286, "1": 0.0031743871147356904}, "score": 4.592279593527753}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5820792919888077, "4": 0.2614764387287817, "3": 0.10595194889060061, "2": 0.02766764774001187, "1": 0.022634628745907208}, "score": 4.352955238372567}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2981064623707133, "1": 0.26604662595926776, "2": 0.24980424196242368, "4": 0.14592313040515803, "5": 0.03989026379602799}, "score": 2.4436786132485815}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.36162797100959554, "4": 0.24836058923118412, "2": 0.19828545393093272, "1": 0.13988000934216055, "5": 0.051730087680702384}, "score": 2.8737606622512852}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4004812860629575, "3": 0.39204448244678236, "5": 0.09887907896405976, "2": 0.08679967513562219, "1": 0.021668673044241474}, "score": 3.468161787716443}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4610199921527968, "4": 0.3714049731028906, "3": 0.1392404756500687, "2": 0.01864291123098541, "1": 0.009625311843581433}, "score": 4.255634716299583}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6042499754665711, "4": 0.32283449062937286, "3": 0.06616024004656043, "2": 0.004486461376902422, "1": 0.002227828354623426}, "score": 4.522454750402734}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3598414000578076, "2": 0.2789265481783162, "3": 0.21664810016033081, "4": 0.10649661269704683, "5": 0.03764485076347134}, "score": 2.182815371421248}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33358889413964754, "2": 0.30641046101642505, "4": 0.16225605583432684, "1": 0.15677400017894294, "5": 0.04061328699611889}, "score": 2.623389604867166}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.366649436988212, "4": 0.361750113397987, "3": 0.20159210605999395, "2": 0.04690418852257461, "1": 0.0226744191415327}, "score": 4.003227083251963}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4584213223216937, "4": 0.38367683739365593, "3": 0.1284656532832005, "2": 0.0198069835286445, "1": 0.009426070228491732}, "score": 4.262116735918686}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.353141341972507, "1": 0.3254742921573089, "3": 0.20564870118156947, "4": 0.09136961459955864, "5": 0.024176250789870363}, "score": 2.1354681023438755}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29237276453204114, "4": 0.23309010113860246, "2": 0.21805472839865425, "1": 0.16951731567579842, "5": 0.08669432091946765}, "score": 2.8493485914455103}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.37315143864705225, "2": 0.22429123844250057, "4": 0.2202523818329068, "1": 0.13101520418955911, "5": 0.0511317164572979}, "score": 2.836168279166798}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.30545869930516606, "3": 0.29663385860837643, "1": 0.2767458785018109, "4": 0.0901175815196906, "5": 0.03088246598459118}, "score": 2.2928178358888336}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6421483032641124, "4": 0.2638897438505889, "3": 0.07397692934463573, "2": 0.011123458748366347, "1": 0.008628211823927878}, "score": 4.5201612021115025}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.24067305133897418, "3": 0.23736106883438457, "1": 0.18255180193812698, "5": 0.17319396977525678, "2": 0.1660689027398553}, "score": 3.0558969361904866}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"4": 0.42065004416207485, "5": 0.26003532287053416, "3": 0.21201212766062036, "2": 0.0642783761864028, "1": 0.04287517893901582}, "score": 3.7908097470939537}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6517249903351982, "4": 0.28522144512028125, "3": 0.05430355416220634, "2": 0.005538514250619189, "1": 0.0030956449811530094}, "score": 4.5771243332463065}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.398945138116875, "5": 0.2916869619164278, "3": 0.2135721210165414, "2": 0.057271486323335646, "1": 0.03828129053232519}, "score": 3.8486912283078025}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8285646355588534, "4": 0.14135220434818088, "3": 0.024365477624142, "2": 0.0030608868033098094, "1": 0.0024872539708848734}, "score": 4.790749687457476}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7290544415464058, "4": 0.20088979597784262, "3": 0.05505466930854313, "2": 0.008224818906663652, "1": 0.0066936711733126325}, "score": 4.637521782171983}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7446996769980156, "2": 0.21437983658221085, "3": 0.038041755255734784, "4": 0.002049076653961085, "5": 0.0008110299295736812}, "score": 1.2998602815458118}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3316618013154181, "3": 0.2895389061941377, "1": 0.2795355788094628, "4": 0.08159034051995571, "5": 0.01757444536434289}, "score": 2.2259296952445706}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3558661862896514, "2": 0.2860790808255749, "1": 0.2605604476461538, "4": 0.07263945844823487, "5": 0.024769545115038}, "score": 2.3149201478028862}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2789428379643869, "4": 0.27650615441095244, "5": 0.20592134571925652, "2": 0.12199597824465387, "1": 0.116589157294832}, "score": 3.3331893887277895}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.45590007374763974, "2": 0.2505455596861146, "3": 0.18675622914438592, "4": 0.07022151734713632, "5": 0.03653697929116507}, "score": 1.9809093711970296}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.34570740914065706, "5": 0.31394153646852563, "3": 0.21406625694235273, "2": 0.07391205045336048, "1": 0.052235444557923144}, "score": 3.7953167414354314}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33695809619368616, "4": 0.2983706420629932, "2": 0.16648277972257858, "5": 0.11466215006736634, "1": 0.08339327569718938}, "score": 3.194451484067248}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8151969976839453, "4": 0.15810672488963676, "3": 0.02405633999296899, "2": 0.0016773854124100122, "1": 0.0008956247844963843}, "score": 4.785151560536881}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6133107919365262, "4": 0.2715649341674681, "3": 0.08768644083955918, "2": 0.016250428521503924, "1": 0.011081997878207007}, "score": 4.459925979679202}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4544896854052557, "4": 0.348721315043733, "3": 0.15460784504037298, "2": 0.028396831697086355, "1": 0.013693623396669687}, "score": 4.202025630387571}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3530857265909726, "2": 0.25773295196974416, "3": 0.22920838753071016, "4": 0.1074606118447517, "5": 0.05244209345112838}, "score": 2.248387608899809}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27855587816766214, "1": 0.2549968466445438, "2": 0.2408411479391135, "4": 0.1450654875853335, "5": 0.08044932466882879}, "score": 2.5550886686190037}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3048084598931104, "5": 0.2985254769127826, "3": 0.20179644251179588, "1": 0.097395876982965, "2": 0.09733570492607017}, "score": 3.609816133097612}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5377291038896489, "4": 0.2923972663963227, "3": 0.13164278486141381, "2": 0.025159664044534406, "1": 0.012971529002197708}, "score": 4.316883981993635}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.32948379724892807, "5": 0.28487647890855405, "3": 0.2350617578504653, "2": 0.08885019763651403, "1": 0.061659522539126634}, "score": 3.6871144050348086}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"4": 0.43676123770808367, "5": 0.3576877785717176, "3": 0.15829761160268352, "2": 0.02800681515585867, "1": 0.019118196521443}, "score": 4.086032990325499}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.47566064960387633, "5": 0.3262704957814018, "3": 0.17303984380332274, "2": 0.017712405662862283, "1": 0.0071753603184360835}, "score": 4.096293360636408}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4992086172282928, "4": 0.3928817904569108, "3": 0.09914035555531335, "2": 0.005932269643446906, "1": 0.0027595407721474844}, "score": 4.3799545185588595}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8727768313630606, "4": 0.10596771571361811, "3": 0.018027083734928707, "1": 0.0015197582542944544, "2": 0.001503649238104142}, "score": 4.847356850086146}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7418655141636504, "4": 0.2215040954614351, "3": 0.03146999584299647, "2": 0.0027608065877749296, "1": 0.0023173592405398534}, "score": 4.697979221349998}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3682143270081708, "2": 0.2552823988805325, "1": 0.16630023162001661, "4": 0.1586052132330068, "5": 0.05150934662063711}, "score": 2.673712173546202}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33750025942607365, "4": 0.2557322449553018, "2": 0.18431017627759752, "1": 0.1253857241208922, "5": 0.09697820659501469}, "score": 3.014608397884143}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3913544922272728, "4": 0.29299580132984904, "2": 0.15570984057309764, "5": 0.09059411716454852, "1": 0.06922047352006089}, "score": 3.1800558045699856}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.41084137002407806, "5": 0.2687091261099936, "3": 0.23361355574065867, "2": 0.05205469428476766, "1": 0.03468370842904271}, "score": 3.826918173174658}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.36708241210210363, "3": 0.2532657363937515, "5": 0.2501905128333948, "2": 0.07887653477420681, "1": 0.05051449773702681}, "score": 3.6876062504753637}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3285419984718868, "4": 0.28971230503904083, "2": 0.14196899362177268, "5": 0.1392100410087191, "1": 0.10043768435163417}, "score": 3.2253170855674065}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.36530144117742575, "3": 0.25234865401811635, "5": 0.19528391596907374, "2": 0.11812847211902525, "1": 0.06871368501193174}, "score": 3.5004254420523178}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3992954339958519, "5": 0.36757257383598874, "3": 0.18189743403811967, "2": 0.03328057119051108, "1": 0.017667088094093238}, "score": 4.066131706244735}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7554469863620661, "4": 0.21666801103562625, "3": 0.024618841858760645, "2": 0.0020024016376569203, "1": 0.001078442185467336}, "score": 4.723722132628449}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.467377498446139, "4": 0.4239431258048913, "3": 0.09115614169861287, "2": 0.011673503074085679, "1": 0.00565963147109966}, "score": 4.335959321886905}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5688787845362013, "2": 0.230386349241363, "3": 0.12117835626083262, "4": 0.05588775358574947, "5": 0.023405224788085027}, "score": 1.7342207120226285}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.2803933893175329, "4": 0.26460516697436753, "3": 0.22849361777517252, "1": 0.1338585009517022, "2": 0.09244153392288806}, "score": 3.465330101217348}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5278268102359417, "4": 0.2759574753374638, "3": 0.12564731300254295, "1": 0.0389141438238007, "2": 0.03139340939428716}, "score": 4.222708340044377}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.3783579400764861, "3": 0.163434268010105, "4": 0.16073574465732432, "2": 0.15063767935342653, "5": 0.14667488620521021}, "score": 2.546659658074094}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3022100117930052, "3": 0.19983245270627883, "4": 0.18098281445256875, "5": 0.16117897265577882, "2": 0.15550890221973476}, "score": 2.7433382115066904}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.30152890402407984, "1": 0.2716729026861211, "3": 0.267722843402208, "4": 0.12777185349347642, "5": 0.03114666817947058}, "score": 2.345087771740589}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3883512948062938, "5": 0.2940108816245481, "3": 0.23880768887810971, "2": 0.05166962987273856, "1": 0.026995232571346218}, "score": 3.870856891515204}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5762267111374411, "4": 0.3060311453560195, "3": 0.09675337151298312, "2": 0.012573887953852638, "1": 0.008268316977736478}, "score": 4.429583575586086}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5468169642587143, "4": 0.34026154741349735, "3": 0.08788836933971404, "2": 0.016383754735404446, "1": 0.008469176504629682}, "score": 4.400825779828927}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.36158631386683276, "5": 0.33184569241259654, "3": 0.20386829630081654, "2": 0.0604330220957867, "1": 0.04200453459412286}, "score": 3.881066570841916}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8080008730129933, "2": 0.13838460189116683, "3": 0.0371509847785045, "4": 0.010956997343572977, "5": 0.005420869782118043}, "score": 1.2672639399621146}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4384836298595746, "4": 0.35941973326670357, "3": 0.15551635127455454, "2": 0.029627479109706607, "1": 0.01685915578038283}, "score": 4.173151068744824}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5007024332307837, "4": 0.3408227607564126, "3": 0.13100075400947905, "2": 0.017644248724623838, "1": 0.009763522810332773}, "score": 4.305142838351303}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7745596845920697, "4": 0.1666275994508002, "3": 0.045899961531943895, "2": 0.006434192058830038, "1": 0.006379688546372687}, "score": 4.696721160785978}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7608539180954322, "4": 0.19263982987230932, "3": 0.038299731242012025, "2": 0.004335111275457799, "1": 0.0037657847745321267}, "score": 4.7026608283463895}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30641177858424024, "4": 0.2616283745175166, "2": 0.16286696126449313, "1": 0.1406818248250609, "5": 0.1283566193938863}, "score": 3.0741150373181636}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.41157633986321274, "4": 0.36087252476651666, "3": 0.16701534242113575, "2": 0.03125909203487654, "1": 0.029216869906775314}, "score": 4.0943978515705615}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3491581177236628, "3": 0.32890208055796627, "5": 0.19685507123478332, "2": 0.08281961910049165, "1": 0.0422098572961553}, "score": 3.5756607341086784}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5308529640212232, "4": 0.30400069238386673, "3": 0.12739132892163318, "2": 0.024041816754980336, "1": 0.013586800622291574}, "score": 4.314657371563689}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6391207342268148, "4": 0.2710593441424635, "3": 0.0746093831642789, "2": 0.009518484823891126, "1": 0.005613984286674284}, "score": 4.528673701770097}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5888282993309764, "4": 0.27720219312259864, "3": 0.08569439997750239, "1": 0.03022701856789845, "2": 0.017908539730243322}, "score": 4.376688330771163}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7221417859045733, "4": 0.20151847791265012, "3": 0.057923621903238104, "1": 0.009588735067362726, "2": 0.008696223743681791}, "score": 4.618140583829749}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33749381323268, "1": 0.17737247127168032, "2": 0.1670460593669436, "5": 0.16145881246853225, "4": 0.15648318795188565}, "score": 2.9576036357061763}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8184453441718396, "4": 0.13928219834632127, "3": 0.03210172859450295, "1": 0.0060592818047010295, "2": 0.003969986042628196}, "score": 4.760333355625215}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4961562905381266, "4": 0.24586686223102425, "3": 0.13959699704837844, "1": 0.07367534998348484, "2": 0.04456319432514872}, "score": 4.046413413376931}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5983920427223135, "2": 0.16652440562052967, "3": 0.131387855644458, "4": 0.06419413677172885, "5": 0.039258382133990105}, "score": 1.7791055163860994}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.31631677973955735, "5": 0.3094517176988267, "3": 0.25229652417139475, "2": 0.06094268174957888, "1": 0.06092129462194524}, "score": 3.7524883723372238}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.5062100891074997, "2": 0.24616043028026527, "3": 0.18536420750807453, "4": 0.04327497307949049, "5": 0.018921669108200426}, "score": 1.8224568869375948}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5101303998323816, "4": 0.30342345738809967, "3": 0.12058856702146177, "1": 0.037807688408073005, "2": 0.027942107458260475}, "score": 4.220258292085052}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4543587476124168, "4": 0.3178088110888545, "3": 0.14681259051918413, "1": 0.04133455690264533, "2": 0.03954166709055946}, "score": 4.104474157491674}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.38478324624606763, "5": 0.2529860576186021, "4": 0.18928635589290085, "2": 0.09609797836613068, "1": 0.07673694536089062}, "score": 3.4457353728534845}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5718007428223891, "4": 0.33897270197211976, "3": 0.07491800725985835, "2": 0.009629166590112362, "1": 0.004608955593622439}, "score": 4.46383020119675}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8436066226044687, "4": 0.13468811938668487, "3": 0.02021189876951213, "2": 0.0009493617891725584, "1": 0.0004630898788181641}, "score": 4.820173088832856}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5428637018720952, "4": 0.33981521309965573, "3": 0.09563506858367403, "2": 0.01425664735476203, "1": 0.007338718814678377}, "score": 4.396735146285028}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.488935074649558, "4": 0.34697942317536024, "3": 0.13931405582784726, "2": 0.017040024837197788, "1": 0.007678607986564915}, "score": 4.292520594230889}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"3": 0.46799064620765857, "4": 0.21219046241898373, "2": 0.15060223847725726, "5": 0.10168918741666838, "1": 0.06730391309266397}, "score": 3.1303879211207075}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7218369980872685, "4": 0.19612873973321782, "3": 0.07180138596360396, "2": 0.006949900055586416, "1": 0.0032096117477886927}, "score": 4.626552943457743}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4172589653134864, "4": 0.338238706674274, "3": 0.1953207890531183, "2": 0.02967771652891566, "1": 0.019361484913452128}, "score": 4.104513164606499}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9170981065731041, "4": 0.07536331204786885, "3": 0.006427527116549936, "1": 0.000526300981868586, "2": 0.00044084355324684884}, "score": 4.908340708468161}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7922818018789655, "4": 0.17908086775382878, "3": 0.025265132394966663, "2": 0.0016971488210880598, "1": 0.0015505298000029245}, "score": 4.759065300760544}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2957706074314814, "5": 0.2162451632271364, "4": 0.20602363165503648, "1": 0.1598669935139032, "2": 0.12202724982115934}, "score": 3.1967657775258664}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3686022240456379, "4": 0.2768222155414956, "2": 0.14396698162052554, "1": 0.11405180545450132, "5": 0.09643957814045713}, "score": 3.097642222492419}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.83503967524218, "4": 0.13062281286767288, "3": 0.03029577545847267, "1": 0.002080087331192632, "2": 0.0019201297828356496}, "score": 4.794696373475622}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6507845785898415, "4": 0.25040021027503917, "3": 0.08447513907821565, "2": 0.00835868634498491, "1": 0.005957573569570384}, "score": 4.531732007791206}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30279723163908073, "4": 0.2755796173343917, "5": 0.15850944460924993, "1": 0.1398683438358398, "2": 0.12321227476659516}, "score": 3.189655819411253}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"2": 0.31674311386044984, "1": 0.30553000168624805, "3": 0.21279085437485099, "4": 0.13310041974230238, "5": 0.03166843612434205}, "score": 2.2685118888096065}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.42265611393310404, "4": 0.27016216207341887, "2": 0.16318358885418305, "5": 0.07527486485246572, "1": 0.06864609713658024}, "score": 3.1202453883664303}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6857199779492041, "4": 0.23748118017871073, "3": 0.05891495592080522, "2": 0.010138988897919646, "1": 0.00762103188860297}, "score": 4.583736253153922}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4242117449250189, "4": 0.39370203977775775, "3": 0.13867745637769321, "2": 0.02863933375227031, "1": 0.01465331484252092}, "score": 4.18431707763096}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.37963891564335084, "4": 0.35825559314076955, "3": 0.17695438349343223, "2": 0.047526715237080075, "1": 0.03751170355114468}, "score": 3.9950954383324975}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4078779873154412, "4": 0.4017152800013145, "3": 0.14140479714985302, "2": 0.027118950907769356, "1": 0.02179488869957856}, "score": 4.146863560332664}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.43945030496587395, "4": 0.32594947313862316, "3": 0.18157432590223083, "2": 0.031331352671185, "1": 0.021593505085382905}, "score": 4.130445938492736}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.36952794951745666, "5": 0.2879368769862745, "3": 0.24642314970774062, "2": 0.056567537540399775, "1": 0.039396314801877476}, "score": 3.810161579158733}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6027625746539617, "4": 0.29361514493678714, "3": 0.07926139429234877, "2": 0.012964016771574419, "1": 0.011283953575940999}, "score": 4.463773653449541}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3764974028148921, "3": 0.2777081880133976, "5": 0.24091974722846268, "2": 0.06276130235363467, "1": 0.04189049196002037}, "score": 3.711953282338558}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3346267993308524, "4": 0.2716327795615601, "2": 0.16608188983583838, "1": 0.11933328336245634, "5": 0.10820231686485254}, "score": 3.083299196787776}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5232342073268478, "4": 0.37810481630070814, "3": 0.08691244903078778, "2": 0.008100973818694084, "1": 0.00360392950369619}, "score": 4.409325878587597}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8263614089935161, "4": 0.14986114703971917, "3": 0.022089349714213703, "2": 0.0009715291348929588, "1": 0.0006709194989153463}, "score": 4.800352775110402}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9031948753902239, "4": 0.08092384918750117, "3": 0.01392451950066569, "2": 0.0009889903338990414, "1": 0.000922735435478925}, "score": 4.884564000966946}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5875952373346884, "4": 0.30222415555251847, "3": 0.08770048056258743, "1": 0.0112284448675904, "2": 0.011194552532830169}, "score": 4.44384567362964}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6171155472004166, "4": 0.2974254124156048, "3": 0.07625372593249478, "2": 0.005835321011106361, "1": 0.0033068030574215828}, "score": 4.519303585065854}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7049108486370874, "4": 0.21620654528966854, "3": 0.06725674285665313, "2": 0.006336032468725193, "1": 0.005240156052925404}, "score": 4.609291839070443}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.622868100066014, "4": 0.3000473750380441, "3": 0.06872066667699156, "2": 0.005232518856101829, "1": 0.003082582066261117}, "score": 4.534460708337306}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9580248422308936, "4": 0.038183026292867, "3": 0.003406921095827071, "2": 0.00016476225531562562, "1": 0.000143545141115302}, "score": 4.953931121350834}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7955638264834206, "4": 0.17179630108823452, "3": 0.028009641186078713, "2": 0.002593414322997419, "1": 0.0019258799476992796}, "score": 4.756673659892543}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6325029654075935, "4": 0.21307079448941038, "3": 0.08735174198619057, "1": 0.04158772613836611, "2": 0.025397251994587176}, "score": 4.369626629987078}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6880004410417112, "4": 0.20868519636947225, "3": 0.08417936996890868, "2": 0.010291092126763487, "1": 0.008763740214779898}, "score": 4.556992314833939}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7787277194094071, "4": 0.17361452689259516, "3": 0.04212753559310068, "2": 0.0030458873747371234, "1": 0.002440945047780134}, "score": 4.723216951184428}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8628673048792512, "4": 0.09754688936671112, "3": 0.02910538995892422, "1": 0.0062856520204861545, "2": 0.004153033283660485}, "score": 4.806632553464034}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25936623016003085, "4": 0.23664846713532559, "2": 0.17561517210577351, "5": 0.16900508090235764, "1": 0.15926783453495827}, "score": 3.0805156151028807}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2648632033642233, "4": 0.2601925097053635, "5": 0.21290355696762073, "1": 0.1339476268277368, "2": 0.12779300148517764}, "score": 3.2903985175742005}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.35426225740777423, "4": 0.3519951084251703, "3": 0.19708564470949588, "2": 0.05585925251246212, "1": 0.04051645869061722}, "score": 3.9238873227605047}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.44867357055369717, "4": 0.30951404755117673, "3": 0.18144135326489913, "2": 0.033928995693174646, "1": 0.026211996272781955}, "score": 4.1207660176959715}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.47207250165093145, "4": 0.37559952360730187, "3": 0.1149093870386691, "2": 0.020908761444157705, "1": 0.016356007793304508}, "score": 4.266318533052159}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5991654551858726, "4": 0.3019397152231729, "3": 0.07717609655602554, "2": 0.012501683046719204, "1": 0.009087128657100518}, "score": 4.4697856417410184}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.34717850766446656, "4": 0.21841256602981743, "2": 0.18563748730705001, "1": 0.14481639214738956, "5": 0.1036508748200929}, "score": 2.950428965946058}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3545234803796085, "5": 0.35332456390108735, "3": 0.19716477076681954, "2": 0.04971623198031274, "1": 0.045090148190744424}, "score": 3.9214426810625294}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3511502445329065, "4": 0.20455045708931724, "2": 0.18073906819883703, "1": 0.13584192302158205, "5": 0.1275914648753854}, "score": 3.007311399992747}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3040728707154677, "4": 0.2720850711513509, "5": 0.15664247496287048, "2": 0.14050396078009864, "1": 0.12654892331604178}, "score": 3.1917963500118853}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.36559657778144017, "5": 0.29134172152188165, "3": 0.21023857955732028, "1": 0.07505530779142879, "2": 0.05769042867944523}, "score": 3.7405362827176396}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3109932410491499, "2": 0.2797397982043029, "1": 0.21830666161918846, "4": 0.1438881668828348, "5": 0.046920199654261564}, "score": 2.521302715030221}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3673061068380546, "4": 0.31873418481726157, "3": 0.19089785205309218, "2": 0.06462868024995981, "1": 0.05825954717304625}, "score": 3.8723500890562916}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3908115517550467, "3": 0.24040583609842792, "5": 0.2272555099531504, "2": 0.08091553064338522, "1": 0.0605053371790965}, "score": 3.643464724729994}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.39682069507679557, "3": 0.2552784420340155, "5": 0.21845452711398486, "2": 0.0863297424550913, "1": 0.042902602094678}, "score": 3.6617364084452757}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4139213744420274, "5": 0.32908792983145846, "3": 0.16488035323927944, "2": 0.05025307197905555, "1": 0.041705786283811476}, "score": 3.9385747688291333}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4066620835278236, "2": 0.2942998892675004, "3": 0.18281236134700177, "4": 0.0694609677002757, "5": 0.046676782531486154}, "score": 2.0551074056162455}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.37994608040523464, "4": 0.22096633928333684, "3": 0.17589810508148085, "1": 0.14981674975963316, "2": 0.0730859158807125}, "score": 3.608313554854844}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2657582813667715, "5": 0.21947663469316878, "1": 0.19287566894929345, "4": 0.18057409262107155, "2": 0.14116173348015626}, "score": 3.092628517339784}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.33744751225782393, "3": 0.261020455804682, "5": 0.23788043630651398, "2": 0.10140074912822772, "1": 0.062147573775088644}, "score": 3.5875731684762577}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.32148734449947647, "4": 0.28979218973313925, "3": 0.20180269829847797, "1": 0.09530776424735056, "2": 0.09149849087555577}, "score": 3.650725423280387}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5191638719941234, "2": 0.1907858278962437, "3": 0.1702232956499734, "4": 0.06533430735734955, "5": 0.05433497242321895}, "score": 1.9447242372882707}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.39716676242810905, "2": 0.24759951425178842, "3": 0.2035723314808519, "4": 0.09700945800751178, "5": 0.05452314437649606}, "score": 2.1640150416051145}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4590117684158748, "2": 0.24602520228112168, "3": 0.2076903106264002, "4": 0.058962761226373395, "5": 0.028191530021523612}, "score": 1.9511728722566533}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.3461934348085483, "3": 0.2551424148788685, "2": 0.2311667886985097, "4": 0.1276246812566169, "5": 0.039721391805445316}, "score": 2.283405393991579}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7363849773157697, "2": 0.16912303689146507, "3": 0.06884747007112745, "4": 0.019163995399898166, "5": 0.006406232079459701}, "score": 1.3899638612810608}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.37074403021825136, "4": 0.30658764811493483, "3": 0.17184695410368295, "1": 0.08444463216786027, "2": 0.06621577178026429}, "score": 3.8131015522006626}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8631644843996338, "4": 0.08657444494293218, "3": 0.03343195833828859, "1": 0.010560665308391694, "2": 0.006180529077073647}, "score": 4.785758554250484}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6368002320830528, "4": 0.21617286293383606, "3": 0.10765248191785091, "2": 0.021782462618187084, "1": 0.01748841705089143}, "score": 4.433162424884723}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4757603823131817, "4": 0.3094467974556313, "3": 0.14399453953801628, "2": 0.037948488676676224, "1": 0.03268607280197728}, "score": 4.1578364878817}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8804241667216613, "4": 0.09398357932535521, "3": 0.020673191803721815, "1": 0.0025614699142962063, "2": 0.0022884658967309225}, "score": 4.847548221286604}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3897948359282093, "2": 0.27660369533194346, "3": 0.21876355280140947, "4": 0.08492633884769983, "5": 0.029790009302135875}, "score": 2.088202145014727}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3358288244079786, "4": 0.3243010590581421, "3": 0.19889989918203324, "1": 0.0736996668610435, "2": 0.06701565702174388}, "score": 3.7817429783099232}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.692369968272197, "4": 0.2249104401041064, "3": 0.06945229256718329, "2": 0.007424143162071242, "1": 0.005646622501020113}, "score": 4.591245721405785}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6937875841760676, "4": 0.22488871480494121, "3": 0.058862433097654196, "2": 0.011191060377244525, "1": 0.011058824195245898}, "score": 4.579489052074634}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5141727913899986, "4": 0.2638579206664571, "3": 0.1423371414302857, "1": 0.04285073419554804, "2": 0.0365434871066806}, "score": 4.170236976828344}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"3": 0.37810796592694607, "4": 0.22685777493428433, "2": 0.17520883038659502, "1": 0.11373537509618183, "5": 0.10596592487435515}, "score": 3.036114526956266}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3211958234344954, "5": 0.2901601984716812, "3": 0.22550422140839793, "1": 0.08363023178828441, "2": 0.07937427148127998}, "score": 3.654970072259569}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.30413384343835725, "5": 0.2758926881285705, "3": 0.2387916176614507, "1": 0.09367244592059557, "2": 0.08741230646475671}, "score": 3.581218456763772}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3182758243442751, "4": 0.2804106620823105, "5": 0.1433430027774532, "2": 0.134012352559499, "1": 0.1238931844914594}, "score": 3.185309986378601}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7216659069062554, "4": 0.18396488168443442, "3": 0.07124775279856685, "1": 0.012622330143078734, "2": 0.010366026528852717}, "score": 4.591897893377934}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3643293546433124, "4": 0.22612966619782146, "2": 0.20823144532164461, "1": 0.12989101841471334, "5": 0.0712719455171236}, "score": 2.900645512703195}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.37147552446353244, "3": 0.3110627558065091, "5": 0.21058681248975436, "2": 0.08112622531783681, "1": 0.025652449880910415}, "score": 3.660281564606282}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4071743324463013, "3": 0.27426952176226876, "5": 0.23045337837927274, "2": 0.061346344129008766, "1": 0.026672489515006507}, "score": 3.753453006195753}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4084331195981208, "5": 0.25351484436816174, "3": 0.23432297036755712, "2": 0.06709585569678975, "1": 0.03646936813214549}, "score": 3.775555284776091}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.32188942275782834, "3": 0.3143399296928229, "2": 0.15781422955753735, "5": 0.1117470549221435, "1": 0.094141924524552}, "score": 3.1992988944229572}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.23239269206552135, "4": 0.21732807517420333, "3": 0.21550895840015766, "5": 0.18401770558447403, "2": 0.15052268127530974}, "score": 2.9700485354694868}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.340129823645706, "5": 0.32755414805534766, "3": 0.23779379224674127, "2": 0.0545683191489598, "1": 0.03965014396549712}, "score": 3.861631252933406}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3441291004525312, "2": 0.2070519605637779, "4": 0.19800987020694957, "1": 0.1616312941055413, "5": 0.08897673036577938}, "score": 2.84561774449032}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6100182769808202, "4": 0.2346238231416573, "3": 0.09758626723717928, "1": 0.03091468392577795, "2": 0.026606593978141753}, "score": 4.366566541679948}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3353158015558129, "3": 0.25892720980670514, "5": 0.20369182278028336, "2": 0.10545487950133932, "1": 0.09650541096818631}, "score": 3.4442803397515345}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"1": 0.28311406670074074, "3": 0.24375996204771258, "2": 0.22080045585955724, "4": 0.1813983930391375, "5": 0.07064667739814742}, "score": 2.5355329011198866}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3415460372930395, "4": 0.25320959360365125, "2": 0.19466461972278185, "1": 0.13680857404365748, "5": 0.07357164394280993}, "score": 2.9320575570288128}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4308060026797381, "4": 0.36333176825186836, "3": 0.16260983464921216, "2": 0.026116541276886937, "1": 0.016875878235374755}, "score": 4.1653784450164775}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5862156228516523, "4": 0.3145341889018781, "3": 0.08120031926396543, "2": 0.01201709211129461, "1": 0.005919182090616973}, "score": 4.463276198851409}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.41811707581175317, "3": 0.2776248880526124, "5": 0.17243647003468726, "2": 0.08377971208744564, "1": 0.047740609074216456}, "score": 3.5839049840667223}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7571699697761937, "2": 0.19315430533634342, "3": 0.039060962978892944, "4": 0.008696679437745044, "5": 0.001824095556992882}, "score": 1.3046912888292446}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.4485240839678723, "2": 0.26832860808710707, "3": 0.18726853053734957, "4": 0.07576051745046997, "5": 0.020039915887596602}, "score": 1.9503813418055957}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3520778017880946, "1": 0.28855155754665407, "2": 0.2628755375692186, "4": 0.06417808382562681, "5": 0.031930896359697765}, "score": 2.28778622182542}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.33081704187638383, "3": 0.2909355249806128, "5": 0.1558056004166416, "2": 0.12464793942944855, "1": 0.09766146689826312}, "score": 3.3225000770074544}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.37806884890035, "2": 0.22186555248684622, "3": 0.21781303974598873, "4": 0.12071459965395591, "5": 0.061322491174284684}, "score": 2.2651980053704555}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"5": 0.41617861828365466, "4": 0.36255873145644246, "3": 0.15653591601945088, "2": 0.03551901827124926, "1": 0.029154465136256497}, "score": 4.101146656456642}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9201854345094365, "4": 0.06808107531282671, "3": 0.010734025817743038, "1": 0.0004953031294985884, "2": 0.00048047007998223805}, "score": 4.907026047633847}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8900997000517059, "4": 0.09222615609367804, "3": 0.01601067646838691, "2": 0.0008118331655970452, "1": 0.0007887459333013402}, "score": 4.8701538419370545}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9898458985497753, "4": 0.00941281048449155, "3": 0.000604326465654345, "1": 4.304424576584871e-05, "2": 0}, "score": 4.989205345764466}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9389999293626705, "4": 0.055313913596149254, "3": 0.005117076495419304, "1": 0.00027178370777631065, "2": 0.0002578586477809563}, "score": 4.932588564053531}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3595254182032084, "3": 0.232243961877674, "2": 0.22054696799454002, "4": 0.10455165745552641, "5": 0.08295220337583772}, "score": 2.3307379324474735}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7821628124840341, "4": 0.18631933919978733, "3": 0.02765557897829472, "2": 0.0022076117585895887, "1": 0.001560986009520337}, "score": 4.745478882137122}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3537207920770993, "5": 0.3451435022095044, "3": 0.23142644225177347, "2": 0.04151661377206144, "1": 0.02809669008920568}, "score": 3.9463886176191636}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6490083476721374, "4": 0.2848887003716477, "3": 0.05580943711332456, "2": 0.006142677849871896, "1": 0.0040586454258157295}, "score": 4.568790056228315}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7509773781314383, "4": 0.20209659556778936, "3": 0.03922090435357695, "2": 0.004298863042352548, "1": 0.0033421645935724467}, "score": 4.6931766825944985}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5478089139580251, "2": 0.24249412395780795, "3": 0.13318256804142758, "4": 0.059878683817976154, "5": 0.01658451251734549}, "score": 1.7548720092802423}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.32659882373450744, "4": 0.2846217708333403, "3": 0.2641852810073958, "2": 0.07396913258717913, "1": 0.05047548026096861}, "score": 3.7630134045303243}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6835121820047523, "4": 0.2160737487875054, "3": 0.08420771793488947, "2": 0.009062366408871831, "1": 0.007011286999457564}, "score": 4.560220210279314}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6546639358847557, "4": 0.24390789608794033, "3": 0.07702192171882964, "2": 0.014827400867393904, "1": 0.009473223869421872}, "score": 4.519622424159983}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5870381029100222, "4": 0.28872153560401986, "3": 0.08997010774391778, "1": 0.01768479585128051, "2": 0.016525913746125255}, "score": 4.410986251944842}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5460085412743351, "2": 0.260667872801477, "3": 0.1125955257338361, "4": 0.06371890363930727, "5": 0.016906611847248593}, "score": 1.7447184495088819}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7646873893842495, "4": 0.1933392038170167, "3": 0.03518142621459541, "2": 0.003646756998112495, "1": 0.0030630154716548546}, "score": 4.713082023887041}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4026226532388922, "4": 0.37453830433008506, "3": 0.18802999142860638, "2": 0.024759614518664524, "1": 0.00998285657155416}, "score": 4.135133860258845}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5216232995420047, "4": 0.38919181080063187, "3": 0.07766011297042348, "2": 0.007470801423372975, "1": 0.003968401143647516}, "score": 4.417152077715816}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4752169416256857, "5": 0.31243516604071325, "3": 0.1686528868867787, "2": 0.02795478207774554, "1": 0.015646553654759032}, "score": 4.040936888580825}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3709577144849884, "3": 0.301149608352393, "5": 0.16130233787510445, "2": 0.10837259885725022, "1": 0.05808872476293205}, "score": 3.4690728596000913}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.41071275572674243, "4": 0.39740582150135983, "3": 0.1517321626906208, "2": 0.026049479286095276, "1": 0.014019150376952163}, "score": 4.164837474247563}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5657052478156444, "4": 0.30550821817371926, "3": 0.09426064638889871, "2": 0.02057655413821417, "1": 0.01372074991020355}, "score": 4.389218212309477}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5922268647642662, "4": 0.29637717379902967, "3": 0.08874753727728146, "2": 0.012841110460464948, "1": 0.009689207904716106}, "score": 4.448782486663936}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.48203690570982427, "4": 0.30990425005613886, "3": 0.1577119359782545, "2": 0.03046744020047933, "1": 0.01980392358607597}, "score": 4.203993729170379}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6185904419189429, "2": 0.2844651581144475, "3": 0.07335900605458241, "4": 0.01953017838966174, "5": 0.003920291365532446}, "score": 1.5055230781298035}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3495881610666472, "5": 0.32517027850379177, "3": 0.2029034558527399, "1": 0.061394747075816325, "2": 0.06087956564884911}, "score": 3.81631173231109}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3854786384866784, "5": 0.3115128779112565, "3": 0.2311217155694864, "2": 0.039652340644320244, "1": 0.03217888457743985}, "score": 3.9045445254554463}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5721225856423606, "4": 0.30408737533733327, "3": 0.09784185776473624, "2": 0.014030490846280818, "1": 0.011789802689314446}, "score": 4.41090288755054}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2775750033425048, "2": 0.24670238201023167, "1": 0.23579646087579634, "4": 0.17713268402120913, "5": 0.06271767958732033}, "score": 2.5842412290090295}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6900729654173384, "2": 0.24640203214871098, "3": 0.05206776165291924, "4": 0.009588255642595078, "5": 0.0018058561108534755}, "score": 1.38655014936079}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3669590564344773, "4": 0.2850177556864161, "2": 0.14970073166900422, "5": 0.13132435810363158, "1": 0.06693231460455286}, "score": 3.264118485654477}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3815093194941131, "2": 0.23022168187725328, "4": 0.19867369970735235, "1": 0.1409971502219587, "5": 0.048543824067931444}, "score": 2.7835336060649856}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3275265691571693, "3": 0.2849173616165416, "5": 0.16993637103916934, "2": 0.12902457356628605, "1": 0.08851803167339714}, "score": 3.361366533133572}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30190312234726097, "4": 0.2745055224554857, "5": 0.17556830667080897, "2": 0.13336651353342183, "1": 0.11458076883457483}, "score": 3.263134021248479}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"1": 0.48740221172436676, "2": 0.21373428378938034, "3": 0.17855885718201508, "4": 0.08095065560524983, "5": 0.03901517913440553}, "score": 1.9700933613264175}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.29950466068354, "3": 0.2596554030330431, "5": 0.2143322924073008, "1": 0.12081779436302052, "2": 0.10537090759477948}, "score": 3.3812843567414843}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.2955511383756026, "5": 0.24848388118398693, "3": 0.2434287955407481, "1": 0.11366117560432164, "2": 0.09858192013084938}, "score": 3.4667514291904897}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4550522006083604, "4": 0.35504859910116365, "3": 0.13664134576604528, "2": 0.028533244437944576, "1": 0.024580871987138337}, "score": 4.1876287194005215}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3713299123156258, "4": 0.3213261590168479, "3": 0.16826358008246067, "1": 0.0793652788857613, "2": 0.05938870038013981}, "score": 3.846142880572286}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5414926803454728, "2": 0.29128217735962325, "3": 0.12022175298521662, "4": 0.03633688637734854, "5": 0.010593128953269765}, "score": 1.6831589843682009}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4704711686230317, "4": 0.34244712936950616, "3": 0.1452716995378128, "2": 0.027711840562296395, "1": 0.013981615372947141}, "score": 4.227857497843496}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.46662557943073524, "4": 0.40169057527127267, "3": 0.11759433693402878, "2": 0.010045430746019861, "1": 0.003761759044481519}, "score": 4.317744809132462}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7651796470342345, "4": 0.18559177042419153, "3": 0.04027008070594392, "2": 0.005154951860325391, "1": 0.0036442211959988296}, "score": 4.703779131289533}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.376387816607553, "5": 0.3046291633495253, "3": 0.2191710289153788, "2": 0.06326565323606512, "1": 0.03625163482781587}, "score": 3.8501277556690066}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"4": 0.31304823339835014, "3": 0.2688872048881234, "5": 0.17572173258569887, "2": 0.13656513482026247, "1": 0.10550039310069705}, "score": 3.3170136858257644}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.501920805351247, "4": 0.4130460049888248, "3": 0.07403078194801312, "2": 0.007787176006778891, "1": 0.0030441730227805035}, "score": 4.403252132099709}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4047929609975959, "5": 0.3440528154874617, "3": 0.19918098404696707, "2": 0.03619524942918382, "1": 0.0156170189664899}, "score": 4.025634402079848}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9330623210090778, "4": 0.06156596976334472, "3": 0.004718325543779017, "2": 0.0002882037104256341, "1": 0.0002855129987877816}, "score": 4.926984899130484}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3693571451475908, "5": 0.2734503525290564, "3": 0.23306707297422002, "2": 0.07893958230962765, "1": 0.04498880040843919}, "score": 3.747487957062899}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31474918355771386, "2": 0.31306914571880484, "4": 0.1712999098366221, "1": 0.16515279554171283, "5": 0.03558291044719839}, "score": 2.599032430651367}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.46297908439923885, "5": 0.3393693963860177, "3": 0.16497451030752147, "2": 0.023646284026609374, "1": 0.008975905125992728}, "score": 4.100180094495496}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3581112810359188, "3": 0.2729276601626673, "4": 0.23210259157384353, "2": 0.0804889798662637, "1": 0.05624365748934457}, "score": 3.75544391621198}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8658957488989609, "4": 0.11303446576556447, "3": 0.01857525426336741, "2": 0.0014971908400596063, "1": 0.0009484125225410075}, "score": 4.841522049134216}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6952890990866459, "4": 0.22905516711692323, "3": 0.05792094589372248, "2": 0.009566862258062771, "1": 0.008038868013857824}, "score": 4.594194509970909}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3370839061319592, "3": 0.23762138294101753, "5": 0.17830384313977304, "1": 0.12867289405055266, "2": 0.11827433263104685}, "score": 3.318085353275862}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.727021651435549, "4": 0.21187580530607802, "3": 0.04850761902876374, "2": 0.0063597449794804625, "1": 0.00620140127730198}, "score": 4.647212200132027}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4893772081809978, "2": 0.30360164960313857, "3": 0.16007687666263226, "4": 0.031803815885360916, "5": 0.01510137771378202}, "score": 1.779602822045284}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8458119799484642, "4": 0.12903950257307406, "3": 0.019732726064347155, "1": 0.0029983165434565146, "2": 0.0023749687487575}, "score": 4.812368897407614}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7671108530205277, "4": 0.1824197005085852, "3": 0.040415560794199376, "1": 0.005115086339772958, "2": 0.0048976930051959355}, "score": 4.701583486720151}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.34160297776331255, "5": 0.2682075655283929, "3": 0.2136547253262524, "1": 0.09472484105892194, "2": 0.0813618979265321}, "score": 3.6074786746030334}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3940970816140683, "4": 0.3402620578062012, "3": 0.18306672044368516, "2": 0.04184877724651567, "1": 0.04053833132517207}, "score": 4.005718882313341}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.23594078888285672, "5": 0.22440873052668986, "3": 0.21415723302142678, "1": 0.20693819607159814, "2": 0.11847930203905273}, "score": 3.15241410103959}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.42440478396659886, "4": 0.38684236287753104, "3": 0.13310344115612346, "2": 0.02950493622421494, "1": 0.025878589820384584}, "score": 4.15469683261599}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.36515074889275206, "4": 0.23771328889867246, "3": 0.16707651463947992, "1": 0.14189069092977524, "2": 0.08800083288028727}, "score": 3.5963327103746994}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"1": 0.389379687885333, "2": 0.3137131643157231, "3": 0.1758623662177198, "4": 0.09450184697163956, "5": 0.026375442765744665}, "score": 2.054621849287151}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5390457404421178, "4": 0.3908561849827659, "3": 0.06074192059056559, "2": 0.005626574269019827, "1": 0.003569577633977396}, "score": 4.456414965756154}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3693738774052488, "5": 0.3172598578681317, "3": 0.22196392728942765, "2": 0.05158481153092541, "1": 0.039609947213701806}, "score": 3.8732701594611405}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8527433466004599, "4": 0.12213509632243737, "3": 0.0202699152415417, "1": 0.0028028419343159154, "2": 0.0019221166082674023}, "score": 4.820324593760286}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5547099580199325, "4": 0.33806124557087786, "3": 0.08523562489240094, "2": 0.011028604194579928, "1": 0.010812216788913883}, "score": 4.415043706501656}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4441729523846945, "5": 0.27255934739113763, "3": 0.21280130266230415, "2": 0.046725557228875496, "1": 0.023665949355282066}, "score": 3.8953012412128265}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8001734438503815, "4": 0.17360206181706583, "3": 0.023327170078143677, "2": 0.001617804978593707, "1": 0.0011952131993665381}, "score": 4.770089947478935}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5229070528119357, "4": 0.3638183406746337, "3": 0.09790803101211656, "2": 0.009723392488042906, "1": 0.005541045930076416}, "score": 4.388968827174966}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8354068310261128, "4": 0.1417957694436767, "3": 0.02105424239931874, "2": 0.001031887427244579, "1": 0.0006455589676191126}, "score": 4.810405389204052}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8322148652497534, "4": 0.14673896778990386, "3": 0.01846065810902187, "2": 0.0012997980145622492, "1": 0.0011985382376616324}, "score": 4.807629399552489}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"1": 0.441493889213471, "2": 0.25134414080911954, "3": 0.21163884888178552, "4": 0.07509357323292941, "5": 0.020390866479139937}, "score": 1.981503990120341}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3397098867100287, "1": 0.21594798726369321, "2": 0.20806567581676894, "4": 0.16375180199134948, "5": 0.07242518362127069}, "score": 2.6686075570739876}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.42630556547276666, "4": 0.3080929980077946, "2": 0.13222310417552027, "5": 0.06835572221527901, "1": 0.06497950932105467}, "score": 3.1826301911294506}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.38396873460834124, "5": 0.2945057651561798, "3": 0.20079871310996797, "2": 0.06112426841068967, "1": 0.05932452401728236}, "score": 3.793427517118087}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.43457870997154363, "2": 0.2712064879723965, "3": 0.20850955738851698, "4": 0.0660877020575907, "5": 0.019546297435025166}, "score": 1.964742631919874}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3382706379153149, "3": 0.259946977878487, "4": 0.24331190476381706, "1": 0.08039582757316578, "2": 0.07795338181549444}, "score": 3.68119075167167}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4320234974378433, "4": 0.29307424680532346, "3": 0.19690866247861083, "2": 0.045219720185488935, "1": 0.03250854178580675}, "score": 4.047162282860984}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5251246794073946, "4": 0.2745772326628965, "3": 0.15316755899598095, "2": 0.026835007335438015, "1": 0.020091976956384667}, "score": 4.258063702355269}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6429467134188249, "4": 0.22646956815892172, "3": 0.09467398747468271, "1": 0.01943962053392858, "2": 0.01637538968805772}, "score": 4.45724639567661}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.358812073391668, "4": 0.20984764742733958, "3": 0.19320534344565063, "1": 0.15678299926482456, "2": 0.08104294334858958}, "score": 3.5330275541804763}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.32852580175061463, "3": 0.2580173366500675, "5": 0.2192414379569531, "2": 0.10216171295742306, "1": 0.09194734525165386}, "score": 3.4810034363427094}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.44016195070799546, "3": 0.24962746811602357, "5": 0.24095388797545977, "2": 0.04503327130824973, "1": 0.02415533529729677}, "score": 3.8287822137149794}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3523520010750106, "5": 0.32509198692741226, "3": 0.24547000952600562, "2": 0.049167089102108055, "1": 0.02778340719412969}, "score": 3.897923745651983}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7940130199083393, "4": 0.17308660548633725, "3": 0.028244026360929365, "2": 0.0023216417330721205, "1": 0.00230213805204635}, "score": 4.7542438604855795}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8404054290110252, "4": 0.14020682852059504, "3": 0.016890718653752003, "2": 0.001317499048170831, "1": 0.0010046316721701685}, "score": 4.818008881348835}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8101090830101446, "2": 0.15297989063286513, "3": 0.024106566661966318, "4": 0.00837163896024835, "5": 0.004369555461964009}, "score": 1.243801586859303}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.27303111935014657, "3": 0.25259390459955167, "5": 0.20410236944460317, "1": 0.14839462033764206, "2": 0.12179118488643875}, "score": 3.26267823351122}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3598168956928468, "4": 0.25598874508007496, "2": 0.15741047421650553, "5": 0.13415940452775885, "1": 0.09245304361032465}, "score": 3.1820221980147885}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4290839463754259, "4": 0.2579781725909913, "3": 0.13715183255548058, "1": 0.12083539879811117, "2": 0.05485552873413236}, "score": 3.819697709432928}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5075537816431118, "4": 0.3155569203877535, "3": 0.1305342022958283, "2": 0.02354143073758879, "1": 0.022717607372126972}, "score": 4.261809044494666}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.38973174884184153, "2": 0.22767261068368275, "1": 0.19388517046174464, "4": 0.13725852329645982, "5": 0.05131805189050097}, "score": 2.6244013847591425}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29460797638931235, "4": 0.29066298793740786, "5": 0.29038150095678394, "2": 0.07784432343962873, "1": 0.0463595392075608}, "score": 3.700963296843591}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.418650682538921, "4": 0.32588318175784875, "3": 0.19768152556210297, "2": 0.03741872617513817, "1": 0.020159379802844005}, "score": 4.085671256689178}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3523276896256911, "5": 0.28576645290343144, "3": 0.2366715888200406, "2": 0.07630906808359665, "1": 0.04875515224723511}, "score": 3.750168787796572}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3293551918798836, "3": 0.27857167273372596, "5": 0.2117067958571827, "2": 0.11317245196826722, "1": 0.06710273337447364}, "score": 3.5054369375698893}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3139602793377219, "3": 0.27658480394470053, "2": 0.16157684969423322, "5": 0.12921697639748564, "1": 0.11858318281326599}, "score": 3.1736645466368816}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7944132000596003, "4": 0.1797099709657324, "3": 0.023157520305340695, "2": 0.0016139280319474594, "1": 0.0009919235700184433}, "score": 4.765138863391873}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6426923433065758, "4": 0.28426598847505397, "3": 0.06627759317986819, "2": 0.004637928297764373, "1": 0.0018820343238882583}, "score": 4.561629891389677}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7419745244718926, "4": 0.22714827066291593, "3": 0.02747260644634139, "2": 0.002047946899744785, "1": 0.0011461325548158122}, "score": 4.707116487992299}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5448571874684598, "4": 0.35820357820502124, "3": 0.08491478965097972, "2": 0.008297193117411429, "1": 0.0035985701247118274}, "score": 4.432607969822185}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3286810668704377, "4": 0.20225251257616203, "2": 0.19161303181929865, "1": 0.18044551549307805, "5": 0.09689790311496514}, "score": 2.8435270486504525}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.44427035242381047, "2": 0.2881833123822468, "3": 0.16720910902515276, "4": 0.0757086544080524, "5": 0.024467259550845236}, "score": 1.9477494154127146}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3306049899802358, "4": 0.3252554192271385, "3": 0.24924834751292005, "2": 0.0526011498085106, "1": 0.042183252369214636}, "score": 3.8495885156139082}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6147528880321009, "4": 0.30920917170956086, "3": 0.06485816306777116, "2": 0.006266283771334538, "1": 0.00483030049001112}, "score": 4.522914758762142}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.29891629339108183, "2": 0.2692825173865215, "3": 0.2670448118554346, "4": 0.12142447675048607, "5": 0.043107684633697026}, "score": 2.340376843794963}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3468653550948403, "2": 0.3186879079734063, "3": 0.2153953720212894, "4": 0.09113562476038453, "5": 0.02760796668231119}, "score": 2.1336663054364995}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.30160761333914893, "3": 0.2684980037188401, "5": 0.21584504780608277, "2": 0.11757874495872211, "1": 0.09641061204210953}, "score": 3.4229231060475636}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5328450287006297, "4": 0.342328081200348, "3": 0.10703405758269681, "2": 0.01194440154904299, "1": 0.00578956800914616}, "score": 4.384576101279359}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8708432011302023, "4": 0.10480234828988554, "3": 0.021387049578941813, "2": 0.0015473442572326683, "1": 0.001354584654072055}, "score": 4.842352859676538}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.38724589504983475, "3": 0.24710290739263333, "5": 0.21978416112607815, "2": 0.0890501575515372, "1": 0.05675042123528381}, "score": 3.6243047071002534}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4330862409613882, "4": 0.4181474154874842, "3": 0.11706622250361493, "2": 0.0175744172452528, "1": 0.014021201528690415}, "score": 4.238832537924413}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8448533052079181, "4": 0.12429635563528393, "3": 0.028451107250304794, "1": 0.001203436578113129, "2": 0.001118339816583875}, "score": 4.810617995421813}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4202175607649684, "3": 0.3164879850644978, "5": 0.18841601785351633, "2": 0.048577141413833014, "1": 0.026224754133904165}, "score": 3.6960762250000987}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9564067975395724, "4": 0.040528242590100384, "3": 0.00279289859365028, "1": 0.0001464134630413831, "2": 9.060383653055811e-05}, "score": 4.953026848734805}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6036488042935223, "4": 0.3389342307537289, "3": 0.04983865954645266, "1": 0.003781967129819726, "2": 0.0036693086991971997}, "score": 4.535193611377431}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2702611135740841, "3": 0.23178380888962608, "5": 0.22416591709364816, "1": 0.14358881720749705, "2": 0.12981671603391487}, "score": 3.301714343141501}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.47402751995292586, "4": 0.27509959039060233, "3": 0.1418196924078271, "1": 0.06432441598403293, "2": 0.04443528579758321}, "score": 4.050378793945491}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4030027069743794, "4": 0.30138519945023806, "3": 0.16701312113185315, "1": 0.07598701565017431, "2": 0.05224638380531281}, "score": 3.903500493668504}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.34344829591600307, "5": 0.27778723501156044, "3": 0.22055486371732677, "2": 0.08853754319766893, "1": 0.06950147525124874}, "score": 3.6715968378657378}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.38177818750733394, "4": 0.25650744229420797, "3": 0.1573841259085366, "1": 0.13343674949079046, "2": 0.07040264820340394}, "score": 3.6831229787124555}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"4": 0.37567442561979164, "5": 0.28886483477957187, "3": 0.19330945120307164, "1": 0.07326904975363005, "2": 0.06873728534330983}, "score": 3.7382357200326237}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.43773989151324494, "5": 0.3534899231473155, "3": 0.15966046696858044, "2": 0.03179674350318606, "1": 0.017252900581295767}, "score": 4.078481982177548}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.36737847326896106, "5": 0.3278581610331149, "3": 0.2414792333152357, "2": 0.04338461039302543, "1": 0.01982401494919186}, "score": 3.9401331417149614}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7764976677029741, "4": 0.19001294073678487, "3": 0.03012341809257153, "2": 0.002212792469973417, "1": 0.001109085252787498}, "score": 4.738653980409588}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.49394836082552235, "4": 0.364898188472946, "3": 0.1156310800865201, "2": 0.016372969584311902, "1": 0.00905595795781057}, "score": 4.318433223075822}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3099119047856507, "4": 0.2519863902181453, "2": 0.19226798978879925, "1": 0.13957399335882092, "5": 0.10605152691586402}, "score": 2.9926719418788643}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.806871157171131, "4": 0.15902394350776566, "3": 0.029376997759390344, "2": 0.002593769645098679, "1": 0.002044391681496737}, "score": 4.766242207832941}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.44393834003003485, "5": 0.31690009896321497, "3": 0.197486628644251, "2": 0.02793353334124709, "1": 0.013663899459782344}, "score": 4.022556453372367}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8760354156839618, "4": 0.11020535389546932, "3": 0.012280746109576558, "2": 0.0007336046488540834, "1": 0.000635638024827943}, "score": 4.8604745458504475}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6476522033128509, "4": 0.25770225780303846, "3": 0.07467889178007023, "2": 0.011417306051491525, "1": 0.008372891451120787}, "score": 4.525112680999703}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4067043379133795, "2": 0.23399474994701422, "3": 0.219285487986516, "4": 0.09683023387946513, "5": 0.04305922436918304}, "score": 2.135436351302102}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7761638144362296, "4": 0.15157808110002943, "3": 0.04663280106251624, "1": 0.016556768300589997, "2": 0.00899731301599772}, "score": 4.661913225279702}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6395942295691177, "4": 0.284602616432716, "3": 0.06406683138958554, "2": 0.00653452251744998, "1": 0.005117709516933363}, "score": 4.547151234855344}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6982446333806447, "4": 0.24383768511201157, "3": 0.048896908762025286, "2": 0.004598503750637096, "1": 0.004370866525252256}, "score": 4.627070350506111}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9232131863705401, "4": 0.061572114353737065, "3": 0.012438851737386446, "1": 0.0016006499715621966, "2": 0.0011088646776676414}, "score": 4.903814607997296}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.41046065549741667, "3": 0.24623350153921086, "5": 0.20845656099515578, "2": 0.09147860126571836, "1": 0.04312604810680655}, "score": 3.6498020427688047}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.48457011108439496, "4": 0.27272020485438386, "3": 0.1727366152153181, "2": 0.03774669336891528, "1": 0.03215849927804741}, "score": 4.139874105419711}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5071189943851945, "4": 0.2628089859089018, "3": 0.17653922311802886, "2": 0.029795655043815768, "1": 0.023616161311152125}, "score": 4.200164193156786}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5764282528558414, "4": 0.30782679748875613, "3": 0.08895256756726862, "2": 0.014634160836157891, "1": 0.011997391833809498}, "score": 4.422283103660692}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9156015390367445, "4": 0.072210269958965, "3": 0.010238511820105862, "1": 0.0010249504592488106, "2": 0.0008558246935936697}, "score": 4.90063858408093}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5079782232198301, "2": 0.3466827438845989, "3": 0.1187186821634416, "4": 0.01890089506691625, "5": 0.007644682277352879}, "score": 1.6714517292422224}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30498795346219765, "4": 0.2558224064616804, "5": 0.189718041715098, "2": 0.13479120869861508, "1": 0.11465225515078732}, "score": 3.2711704001384607}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6931885561531862, "4": 0.22695325677394682, "3": 0.06647978250671087, "2": 0.00761169803451075, "1": 0.005707731612539883}, "score": 4.594397237268818}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9076823921065459, "4": 0.07738534944184257, "3": 0.013111284596549722, "2": 0.0009051187567003513, "1": 0.0008806828372202577}, "score": 4.890150130077765}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.33608583175142565, "3": 0.3096492728181953, "5": 0.22504036339500597, "2": 0.0802040393033125, "1": 0.04893012593037852}, "score": 3.6081572246006752}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.30307853973951754, "3": 0.26053553925799877, "2": 0.1541200707756469, "5": 0.1424950951308791, "1": 0.13963828198408254}, "score": 3.1546925878659624}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30735203332033545, "2": 0.22702260158577195, "1": 0.22231842009918035, "4": 0.14907117537683268, "5": 0.09397805325335898}, "score": 2.665281577684481}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30563536659469576, "5": 0.25867743970247115, "4": 0.24140653486338565, "2": 0.10594882335421027, "1": 0.08810714925618729}, "score": 3.4767054015407832}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4773813316749683, "4": 0.30803070790133946, "3": 0.14322135621436807, "2": 0.03925998390865715, "1": 0.03201288503126647}, "score": 4.159616314227702}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8175577880196546, "4": 0.1598655387308815, "3": 0.018750366126681788, "2": 0.0019393546808122797, "1": 0.0018406465191014966}, "score": 4.789443328875938}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.320839173030644, "3": 0.30837268847055904, "2": 0.15215672558019083, "5": 0.1254396139439462, "1": 0.09299326572591732}, "score": 3.2336215255269503}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5465006948017114, "4": 0.29457557129422246, "3": 0.12009516605981745, "2": 0.021016248549272188, "1": 0.017699315720649072}, "score": 4.331312523980832}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.45248436451371277, "5": 0.26233876873505774, "3": 0.23250040779483144, "2": 0.03816575238198657, "1": 0.014445360335942872}, "score": 3.91016490478287}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8814591937921482, "4": 0.10359295017251584, "3": 0.012886790300265254, "1": 0.0010781264638193365, "2": 0.0009456628006223565}, "score": 4.863478885944511}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6473651174028109, "4": 0.2823848844822704, "3": 0.05992470029555118, "2": 0.005983659150954566, "1": 0.004281257945809319}, "score": 4.562663298984497}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"1": 0.23373889966619338, "2": 0.23282764969731579, "4": 0.22353307260825547, "3": 0.22352925022539535, "5": 0.08617014560419689}, "score": 2.6955067170574685}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2864019600984205, "3": 0.25029831812591613, "5": 0.2393968365553696, "2": 0.12018473038706996, "1": 0.10361322529672078}, "score": 3.437830393568912}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3862387412740751, "4": 0.36275743181439973, "3": 0.1885478232551887, "2": 0.03709222871161501, "1": 0.02522397620720528}, "score": 4.047841220116213}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7572441912141644, "4": 0.2042788718060817, "3": 0.03243901545234168, "2": 0.0034048084379799002, "1": 0.0025659743729437553}, "score": 4.71034532744058}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6588701532060101, "4": 0.22780064421226168, "3": 0.07520154522745662, "1": 0.021053888691017587, "2": 0.016910982771328693}, "score": 4.4867642147096936}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.36920962751521474, "4": 0.35046592342049304, "3": 0.19677549881613143, "2": 0.04638384724859434, "1": 0.03708779274633712}, "score": 3.968400613006273}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.36956348872923733, "5": 0.3074882819319651, "3": 0.1813528677561467, "1": 0.07258311209369216, "2": 0.06890641495493251}, "score": 3.7705489641414145}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.325171904359249, "4": 0.21353419397586978, "2": 0.17774502490023547, "1": 0.1545289069724622, "5": 0.1289395228067936}, "score": 2.9846091625978257}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.31510104935372524, "3": 0.2538097013609392, "5": 0.2412367168422807, "2": 0.10187677339646072, "1": 0.08787102188785623}, "score": 3.520010130249671}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3292405303657991, "4": 0.3160175591527272, "3": 0.2181890914909315, "2": 0.07148084980867776, "1": 0.06496759317178949}, "score": 3.7731632834307303}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3239639288815566, "1": 0.31337434896526684, "3": 0.223696423174326, "4": 0.11162779510104776, "5": 0.027209706846126974}, "score": 2.2152342912530725}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3925701624109616, "5": 0.3850550106870498, "3": 0.1685472757992787, "2": 0.036548786296493045, "1": 0.01720013579733502}, "score": 4.091816974380474}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3522983067216604, "5": 0.3153467348427896, "3": 0.2614006999757701, "2": 0.05080519834535745, "1": 0.020102499870177454}, "score": 3.8920231111354537}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.46800191087808257, "4": 0.3585688812573579, "3": 0.1370664821077978, "2": 0.0240077760266692, "1": 0.012270484923163903}, "score": 4.246129211203758}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.49819809496359346, "4": 0.3509449168088258, "3": 0.11578057199296836, "2": 0.022511112563162766, "1": 0.01250389604046264}, "score": 4.2999020259958565}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3940322185728094, "5": 0.3601182965434679, "3": 0.15856791367345457, "2": 0.04781885792628081, "1": 0.03930277311003634}, "score": 3.9880024287937164}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4051775147013016, "4": 0.39126629086539166, "3": 0.16157662348680196, "2": 0.03125669142879272, "1": 0.010686179584510909}, "score": 4.149034439157344}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3833032989223003, "5": 0.36372750657607644, "3": 0.19929331394859648, "2": 0.03881921589210524, "1": 0.014774130009934012}, "score": 4.042476876627655}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7415538848379893, "4": 0.20176248302829186, "3": 0.04586267378713431, "2": 0.005974468136131566, "1": 0.0047271584855942675}, "score": 4.669640708702614}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4103141471966918, "4": 0.3821996128988496, "3": 0.16510408265253246, "2": 0.03026100073356687, "1": 0.011992585441926624}, "score": 4.148729429054036}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.286010801898396, "1": 0.24900574761317437, "2": 0.2290223687654101, "4": 0.1736282429819981, "5": 0.062241879621112245}, "score": 2.5710391203283733}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7925183332973842, "4": 0.14266806082191075, "3": 0.05376044528341106, "2": 0.006887521382298323, "1": 0.004114318796960414}, "score": 4.712676463712535}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.36347360431852493, "3": 0.24522093482404556, "5": 0.23320639548244854, "2": 0.09156281861706371, "1": 0.06644644460964909}, "score": 3.605485061306309}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.370487712291908, "5": 0.3371482953070009, "3": 0.1879826514371197, "2": 0.0599113265950057, "1": 0.04437311104910895}, "score": 3.8962136002858547}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6548243547469971, "4": 0.2149744704495481, "3": 0.08946014143435314, "2": 0.02054671304462073, "1": 0.020160028945324798}, "score": 4.463806604955574}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3940105473967507, "4": 0.2945536556869888, "3": 0.17118685495966923, "1": 0.08703867664297717, "2": 0.05281217118325546}, "score": 3.8560260049392805}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2980095637115271, "5": 0.28316010479078163, "3": 0.2703556404125554, "1": 0.08402138745395617, "2": 0.06422954317939428}, "score": 3.6321989163209185}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3142934108257094, "3": 0.2760361896335551, "5": 0.25778228677794174, "1": 0.07944399269477433, "2": 0.07224743892664101}, "score": 3.5988403406671092}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3637568969459627, "5": 0.3412880967111883, "3": 0.19450424324343218, "2": 0.052258616115497654, "1": 0.04798740971905235}, "score": 3.8982835669353055}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.35426973242026666, "5": 0.3228463065879606, "3": 0.2059613807201403, "1": 0.06333982504703152, "2": 0.05346897499107417}, "score": 3.8199070097220873}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4106892430945326, "3": 0.2459574808652143, "5": 0.2085957313399422, "2": 0.09140029252818192, "1": 0.043111409298552596}, "score": 3.650417495155163}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8124172224742986, "4": 0.14052519253259102, "3": 0.0398381055042726, "1": 0.00369379313146826, "2": 0.003462024657241557}, "score": 4.754621728763346}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.39020478028875893, "4": 0.2542289601711916, "3": 0.24854399670552452, "2": 0.05719887778112188, "1": 0.04971429805650378}, "score": 3.878106836892374}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5901225805607291, "4": 0.300618548092195, "3": 0.08590274454815046, "2": 0.012412485720802844, "1": 0.010824155738062537}, "score": 4.446975804412773}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8988888639589422, "4": 0.08693815284208739, "3": 0.012415718352954982, "2": 0.000848474098481905, "1": 0.0008288080281761475}, "score": 4.882360346904494}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2514112586545492, "1": 0.2376535115238344, "2": 0.22920178642420563, "4": 0.18894196019486678, "5": 0.09260534663110694}, "score": 2.6695823411750506}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.49889665943423006, "4": 0.3363395714652859, "3": 0.12543689193385751, "2": 0.024289886710928268, "1": 0.014920472735850397}, "score": 4.280151218452151}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3747715644847122, "1": 0.30372973579041906, "3": 0.24890661326343375, "4": 0.05708360679214832, "5": 0.015343167776914888}, "score": 2.105391016776478}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6320748236448018, "4": 0.30320746645679186, "3": 0.05336527635756957, "2": 0.0066117738670094595, "1": 0.004638576261606792}, "score": 4.551626582692226}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.4126171143200754, "2": 0.29991322385036834, "3": 0.17127892688289928, "4": 0.08000075554822823, "5": 0.036084552998311974}, "score": 2.026919820714006}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.432447974508241, "1": 0.34146735415069324, "3": 0.19402747620979233, "4": 0.026250201861819394, "5": 0.0057391492151128536}, "score": 1.922272700092918}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.34031061666644247, "3": 0.3091090350768473, "5": 0.22100213872997762, "2": 0.08143110122630338, "1": 0.047741306092197164}, "score": 3.6056469535868745}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.35435955118148216, "2": 0.21658053815473327, "4": 0.17446006803541195, "1": 0.17331715447473828, "5": 0.08108660483485991}, "score": 2.7733739930213526}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.609712466095324, "4": 0.2696633903961457, "3": 0.09092952709651536, "2": 0.016592319025663486, "1": 0.012987665235257427}, "score": 4.4466865098772015}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.33323567719724584, "3": 0.28685098904164674, "5": 0.1742572366380224, "2": 0.12508189452512106, "1": 0.08025864475258887}, "score": 3.3962760144482846}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31734476796656175, "4": 0.26439095000850477, "2": 0.20011897786212038, "1": 0.12349989167993952, "5": 0.09426554806995355}, "score": 3.0058054902255478}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4321101700444011, "3": 0.285913174476577, "5": 0.18240736935362856, "2": 0.07261825082283199, "1": 0.026787827296561637}, "score": 3.6708404898744}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4145453091528133, "5": 0.383547540906527, "3": 0.16309803781363127, "2": 0.024727096805333696, "1": 0.013863400070130897}, "score": 4.129433405388315}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4461932610850182, "4": 0.30925070128997034, "3": 0.15588587655476066, "1": 0.0442990210663617, "2": 0.04415620580391387}, "score": 4.0691127644200735}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4729587044046419, "4": 0.32591616280465546, "3": 0.14223973077073582, "2": 0.03186109519040067, "1": 0.02692210453187401}, "score": 4.186249504784815}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7110727526581279, "4": 0.23779279351491114, "3": 0.04422017703746083, "2": 0.0034509973595245103, "1": 0.003389299554602703}, "score": 4.6498307566362}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5783554407032652, "4": 0.32037016054724204, "3": 0.08779422982796033, "2": 0.0077029284826859055, "1": 0.005712779478113229}, "score": 4.458046541595724}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.775215146319973, "4": 0.16184991885003, "3": 0.05131211473536829, "1": 0.006190799751907838, "2": 0.005379593313241406}, "score": 4.694607861929252}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9417627724862175, "4": 0.052045273237732594, "3": 0.0056039644175563015, "2": 0.00028104071665479733, "1": 0.0002783553564337673}, "score": 4.934788389704664}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.946503761713432, "4": 0.04666890415554846, "3": 0.005904113308789422, "1": 0.0005597325934368602, "2": 0.0003187386723017459}, "score": 4.938324962905663}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32147782861491503, "4": 0.2774236829544356, "2": 0.15477988006718843, "5": 0.1381955041021635, "1": 0.10780427117529302}, "score": 3.183484769756364}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.28992506092466325, "2": 0.2385540904566955, "1": 0.23679968647044503, "4": 0.17348642929053132, "5": 0.06108127650176308}, "score": 2.5834315938268775}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6879900523134865, "4": 0.23805115296026216, "3": 0.06234192039101958, "2": 0.007516841068146583, "1": 0.004001785269728984}, "score": 4.598667911900414}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6318891283821257, "4": 0.23001386253130016, "3": 0.10152051324337338, "2": 0.01861944340313966, "1": 0.01777029563867204}, "score": 4.439900995919381}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.706811583512584, "4": 0.22459329279798276, "3": 0.05526933749005079, "2": 0.007098629086406996, "1": 0.006055586769900353}, "score": 4.619284478390436}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"5": 0.49867150830259493, "4": 0.3600926210242675, "3": 0.10690870853037436, "2": 0.019227800586492795, "1": 0.014948317907861343}, "score": 4.308508843176892}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.653667151330546, "4": 0.27324990488865647, "3": 0.06475922613380802, "2": 0.005558886280760244, "1": 0.0027122140093911286}, "score": 4.569683485846304}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4185129523789469, "4": 0.3447436091901689, "3": 0.18753683491237666, "2": 0.02939105801646644, "1": 0.01973293917893947}, "score": 4.113004518784609}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9044976882337233, "4": 0.083435917237975, "3": 0.01087028564397187, "1": 0.0006195317544603107, "2": 0.0005311876018315373}, "score": 4.890746862702406}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8331504090746713, "4": 0.147027240477546, "3": 0.017496181882497183, "1": 0.0012747992037870583, "2": 0.0009933393600369963}, "score": 4.8098901487872565}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.2934134125809374, "2": 0.23942590109550935, "3": 0.2373769725587653, "4": 0.16817496217248012, "5": 0.06136675745326868}, "score": 2.464526169292993}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30933526199062406, "2": 0.24146810137917293, "4": 0.1979590673925343, "1": 0.18581996576619328, "5": 0.06520518426132706}, "score": 2.715200906205074}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5066075693771657, "4": 0.3651233636135459, "3": 0.10128884421511296, "2": 0.01700972567470206, "1": 0.009773848310008522}, "score": 4.342044991623009}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8246229726117118, "4": 0.13402803292203178, "3": 0.030180809608747756, "1": 0.005980259603531972, "2": 0.005050148147432082}, "score": 4.766506694972084}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3552253862924774, "3": 0.27522035810136025, "5": 0.15228361630734163, "2": 0.13022852333073084, "1": 0.08692115809449745}, "score": 3.3557648119425862}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"3": 0.37715118149305443, "4": 0.24229143512736495, "2": 0.18077248994229198, "5": 0.10411963546150119, "1": 0.0954577536048546}, "score": 3.078859072500598}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.37423026095970363, "3": 0.2966419271590624, "5": 0.18468165868193825, "2": 0.09956446053554072, "1": 0.044680178933979506}, "score": 3.554780555819091}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4231422787957024, "5": 0.4002480496286535, "3": 0.15343856808112652, "2": 0.01689021193979314, "1": 0.006089106036935138}, "score": 4.194799099203241}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4339849295603347, "4": 0.4306117400607772, "3": 0.11807170140841108, "2": 0.012358304657414354, "1": 0.004907353914799885}, "score": 4.276492797432659}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3884496572263192, "4": 0.3798480555653263, "3": 0.1722725953573454, "2": 0.03554835488122023, "1": 0.023347531915596728}, "score": 4.07507783328661}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"1": 0.29201812696307106, "3": 0.2622040923584313, "2": 0.234794034049215, "4": 0.13795223181713773, "5": 0.0728521451975202}, "score": 2.464730223103219}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6081357797447515, "4": 0.14857681228870037, "1": 0.12208315110199358, "3": 0.09045305428945535, "2": 0.03053619126403226}, "score": 4.0903803224128685}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5376115852829005, "4": 0.2330347022059858, "3": 0.13999314805987734, "1": 0.051098164611535796, "2": 0.03809546244018945}, "score": 4.168161090883247}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8091439030932902, "4": 0.14290657270036985, "3": 0.03534906630003941, "1": 0.007078257623070981, "2": 0.005398090494915922}, "score": 4.741855954519681}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6011648795851725, "4": 0.17117583088118896, "3": 0.1067531840662209, "1": 0.08190766522596445, "2": 0.038860545405203666}, "score": 4.170991187832497}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6957129582654333, "2": 0.1640063389124043, "3": 0.09014047429265569, "4": 0.03287391476433109, "5": 0.01711981524655433}, "score": 1.511463221381188}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.3924142645058256, "3": 0.2209590254185517, "2": 0.21260368079145675, "4": 0.12018168975185538, "5": 0.053721622762121356}, "score": 2.2301005555981357}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32153856151278204, "4": 0.21786076781141572, "1": 0.16252133394730597, "5": 0.15875380071247874, "2": 0.1391309643312295}, "score": 3.071208592186285}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.33207092611679184, "3": 0.2413990272368956, "2": 0.1762213154067744, "4": 0.16408754214630827, "5": 0.08611798537413684}, "score": 2.495908321118199}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3030436574071103, "4": 0.22083614009643282, "2": 0.19753569041602603, "1": 0.19665001575251484, "5": 0.08185171683526009}, "score": 2.7936867733416664}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4104816716209863, "4": 0.2971887857079526, "3": 0.20633149593609362, "2": 0.04894889423226467, "1": 0.03693968616688906}, "score": 3.9954328287681964}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8612060917127942, "4": 0.10904343389746364, "3": 0.024969375125839532, "2": 0.002446927801159498, "1": 0.002298246817432511}, "score": 4.824477739602699}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5710782719494376, "4": 0.2889472596742866, "3": 0.11347496943433362, "2": 0.01632154932209858, "1": 0.01004883672432347}, "score": 4.394864675819569}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8285744623937041, "4": 0.13569000092598596, "3": 0.028794620427488486, "2": 0.0036306267035531013, "1": 0.003174574726558045}, "score": 4.783101142812196}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6869851793438395, "4": 0.23062884321022842, "3": 0.059591412551405085, "1": 0.012356253349104522, "2": 0.01036871686179256}, "score": 4.569627216047424}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.644151018237441, "4": 0.23867685811550754, "3": 0.09387219964705358, "2": 0.011794593859407405, "1": 0.011396312965197794}, "score": 4.49255438886418}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.33888217445391133, "5": 0.3115302608148224, "3": 0.22194952229799356, "2": 0.06844586076526034, "1": 0.05908443242578516}, "score": 3.7754115204704704}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3281056889801687, "5": 0.3064318798562299, "3": 0.2671080021330347, "2": 0.05868378649066933, "1": 0.03954893551691862}, "score": 3.803285556661825}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5236246856758289, "4": 0.277345460505726, "3": 0.13520812784276826, "1": 0.03234459017482711, "2": 0.031390317295750175}, "score": 4.228622001337469}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8826152621806264, "4": 0.09377856192480119, "3": 0.01957676255568218, "1": 0.002420363363205549, "2": 0.0015429964597465794}, "score": 4.8527477436025075}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2944289386245074, "4": 0.21739828348051568, "2": 0.20829015404068596, "1": 0.18347319471597817, "5": 0.09615539483432996}, "score": 2.8344304693360503}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3789983604115369, "5": 0.2804725835923814, "3": 0.2179395387159627, "2": 0.0719039268721749, "1": 0.05045370983500254}, "score": 3.767310105360974}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32315910238253914, "4": 0.3035596036864155, "2": 0.15726072220543366, "5": 0.12811399826195902, "1": 0.08768049590040597}, "score": 3.2272172549274103}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.41453672815372744, "4": 0.3780560061196887, "3": 0.144071150606504, "2": 0.038097294876002545, "1": 0.02496276411064325}, "score": 4.119415660888905}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4067350737215335, "4": 0.293296305322799, "3": 0.18819752553083485, "2": 0.06126157302859382, "1": 0.05030673068466418}, "score": 3.945083073381976}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6659502972369246, "4": 0.28565074092326315, "3": 0.04290946706019575, "2": 0.003300576925106836, "1": 0.002117888239907304}, "score": 4.6101293488593}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6705163847127905, "4": 0.27760861971083955, "3": 0.04537250382643179, "2": 0.004041280022253182, "1": 0.002377863223070507}, "score": 4.609978571974461}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8738769698475408, "4": 0.10952548687061235, "3": 0.015690740777488343, "2": 0.0005648044460018035, "1": 0.0003132030048074902}, "score": 4.856141663808681}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8941377883621808, "4": 0.09611557551693951, "3": 0.008895557359164573, "2": 0.0004595076351928741, "1": 0.0003510884050401937}, "score": 4.883305709136516}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7941435107893904, "4": 0.17303055181320265, "3": 0.02834241026984245, "2": 0.002448151570977036, "1": 0.0019882878250803604}, "score": 4.754975483985238}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"3": 0.36246328230888164, "2": 0.2261480965166419, "1": 0.18981495546382132, "4": 0.1731445645836656, "5": 0.04828831369902274}, "score": 2.6638958653007734}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3874243403353996, "3": 0.2723708832783748, "5": 0.24531771809901143, "2": 0.06070870384561052, "1": 0.03404254884984958}, "score": 3.749367743317936}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3509043148308207, "4": 0.34348442857727807, "5": 0.17486507542526886, "2": 0.08998106677043216, "1": 0.04053630445927787}, "score": 3.5222804066857374}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3496868987044307, "3": 0.28594502697836516, "5": 0.2296554813999187, "2": 0.08079383628227842, "1": 0.053691724257750525}, "score": 3.6209615550845244}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.37292416164396597, "3": 0.25488324536192447, "5": 0.21333126215331383, "2": 0.09376918453748587, "1": 0.06487240099712012}, "score": 3.5761993165141015}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3239589722713629, "2": 0.27048998646350825, "4": 0.18021164738858697, "1": 0.16713807696655752, "5": 0.05816423686353664}, "score": 2.6917625512601204}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.41140014060143754, "3": 0.31427119106704177, "5": 0.1866300992474527, "2": 0.06522022231063816, "1": 0.022378012209364216}, "score": 3.674751793294009}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4205236746352506, "3": 0.27329362837122395, "5": 0.2410961409348619, "2": 0.045261671879913916, "1": 0.019738015143637374}, "score": 3.818049317492671}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7760134472644727, "4": 0.1911189633611625, "3": 0.02982623809121706, "2": 0.001879520477188947, "1": 0.001122614768412245}, "score": 4.739089308067696}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.40613799011297363, "3": 0.3183566448358034, "5": 0.15544907390586643, "2": 0.08514560397850356, "1": 0.03477547089746647}, "score": 3.562415639895941}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9761930626877475, "2": 0.022171748292126533, "3": 0.0014101601492690762, "5": 8.176395985605617e-05, "4": 7.473694573061289e-05}, "score": 1.0255450858200346}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3977356461632307, "4": 0.2479172643425089, "3": 0.20067341366327038, "1": 0.07701549835841616, "2": 0.07653285142012732}, "score": 3.8129265894123905}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5389008913643407, "4": 0.32466964192813635, "3": 0.11641041171053461, "2": 0.01302672841940936, "1": 0.006868242691571208}, "score": 4.37587893525923}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5590442778108213, "4": 0.2577869011221733, "3": 0.12973443832074041, "2": 0.028665527802662738, "1": 0.024580692547427785}, "score": 4.29829283373683}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.24391474999611737, "5": 0.21720145327319776, "1": 0.21204094206666393, "2": 0.16360832005904277, "4": 0.16311477253078724}, "score": 3.0098286519845603}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.35675036482172356, "3": 0.20783202451330515, "4": 0.16788908935600047, "2": 0.15956506642076715, "5": 0.10778605379287656}, "score": 2.5103085290742246}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.34257098064244684, "5": 0.31911459778610285, "3": 0.24855088146958682, "2": 0.05613755280117669, "1": 0.033443350547047}, "score": 3.857932612346542}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.43235126833331333, "4": 0.4088698699280907, "3": 0.11937231172690568, "2": 0.02265049438814808, "1": 0.016591321857255256}, "score": 4.217939904319608}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6874324079388688, "4": 0.2456976165876546, "3": 0.052697287254837036, "2": 0.007737971545134447, "1": 0.006363819700930065}, "score": 4.600210271582136}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7225655763500616, "4": 0.2138202650079844, "3": 0.048599637837827885, "2": 0.008130542739699462, "1": 0.0067321817843182035}, "score": 4.637605093761292}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3368193990982393, "2": 0.21433486441024166, "1": 0.19716924645791487, "4": 0.15626167080547204, "5": 0.09527665134178204}, "score": 2.738105430743884}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5170344356596788, "4": 0.2878103277527108, "3": 0.15467972347000072, "2": 0.024912028994856877, "1": 0.015440871371499656}, "score": 4.266240684588298}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5504605981722337, "4": 0.291423804045615, "3": 0.11282547761959401, "2": 0.023115370340908846, "1": 0.021980741398050032}, "score": 4.32552531032897}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9243783328558525, "4": 0.06756189083105311, "3": 0.007225968539919314, "2": 0.0003846459335245168, "1": 0.0003128173763015035}, "score": 4.915569453145729}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8030282621107465, "4": 0.15931477768252877, "3": 0.03219731226328218, "2": 0.003003809387468783, "1": 0.002348457380976448}, "score": 4.757859338755876}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4462434829627365, "5": 0.26957740845149814, "3": 0.187812021877427, "2": 0.054569956223090244, "1": 0.041433787823594075}, "score": 3.8482689803045567}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.48918971476085643, "4": 0.3695422874800526, "3": 0.1082195007571356, "2": 0.020013860909465164, "1": 0.012731900303257424}, "score": 4.302838471318643}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5519269380887936, "4": 0.3464037072944303, "3": 0.08765292472024062, "2": 0.008093160149660711, "1": 0.005644582744814643}, "score": 4.4312741353306295}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6555159129658787, "4": 0.2738821704334538, "3": 0.055613044051405526, "2": 0.007884989422808958, "1": 0.006958212933730214}, "score": 4.563340313159651}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4724029027457966, "4": 0.3719719986456627, "3": 0.12030825960051326, "2": 0.021016708810155257, "1": 0.01409512903208499}, "score": 4.267830744043481}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3756230180922859, "4": 0.21855429622662015, "5": 0.1573322921149568, "2": 0.14190249672637492, "1": 0.10646589285583391}, "score": 3.1784063643056952}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6889215466371883, "4": 0.2529730544694243, "3": 0.04910292861665622, "2": 0.005076790542617516, "1": 0.0038635454759445597}, "score": 4.618112806488159}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9400078412477069, "4": 0.049685079610280174, "3": 0.009204074615372645, "2": 0.0005392784044988474, "1": 0.0005159323013624612}, "score": 4.928221776184463}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9786225786440613, "4": 0.018274758284502084, "3": 0.0026507875353055416, "1": 0.0002668435570337185, "2": 0.00014177943253198855}, "score": 4.974929869772181}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6517327068047651, "4": 0.22460432059938945, "3": 0.08480273367248828, "1": 0.02187618886720902, "2": 0.016882606301253832}, "score": 4.467583627367028}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7577873451469949, "2": 0.14336669933427879, "3": 0.06347725666468233, "4": 0.020316274796950858, "5": 0.014874573503427226}, "score": 1.3908378417947616}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2958854478703733, "4": 0.25546407139234667, "5": 0.2478669918191064, "2": 0.11374049330321996, "1": 0.08656040370673747}, "score": 3.464560947668082}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31728917403338475, "4": 0.29724974537910187, "5": 0.1575748492926575, "2": 0.13902854600415235, "1": 0.08872982503658136}, "score": 3.2959490880127023}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.2973573097942094, "3": 0.26710615909417845, "2": 0.26098634266045084, "4": 0.12768338934641732, "5": 0.04672154834804871}, "score": 2.3653333379807377}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.38132753547501497, "2": 0.24523763493833947, "3": 0.19850406509432014, "4": 0.11783384971708628, "5": 0.05680590485179475}, "score": 2.2233269339628174}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4357775814869796, "4": 0.3045718375355112, "3": 0.14652116353041944, "1": 0.06418395638896256, "2": 0.04868861765148808}, "score": 3.9993271406672126}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7232128513088789, "4": 0.2059368315867159, "3": 0.05442761093118867, "1": 0.008431080854028413, "2": 0.007875948161955203}, "score": 4.627812725083007}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7936610563865015, "4": 0.13558581745305964, "3": 0.054556386362459686, "1": 0.009770645944653556, "2": 0.006317157087206373}, "score": 4.6972343724734325}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7914094810531771, "4": 0.15093457714402653, "3": 0.040444439942234484, "1": 0.011078194081294518, "2": 0.006023121093153772}, "score": 4.705761982254762}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2992693125854661, "3": 0.2447144398141821, "1": 0.160480602566382, "5": 0.15816414386522837, "2": 0.13729697479371597}, "score": 3.1573511472000506}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2785484686798495, "4": 0.2471434355926673, "2": 0.2309058563036129, "1": 0.18003282204864662, "5": 0.06326030118819616}, "score": 2.7826688232188213}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6479146203693991, "4": 0.27229920469521124, "3": 0.06873674232090057, "2": 0.005548978623286504, "1": 0.005389005604728774}, "score": 4.551974420646295}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.876664994407691, "4": 0.10758771614420867, "3": 0.013852788927691513, "1": 0.0009619363247286644, "2": 0.0007999670649150461}, "score": 4.858440289095251}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8486249884250316, "4": 0.13554647615753285, "3": 0.013410580420004144, "1": 0.0012304097930545175, "2": 0.0009869192849904333}, "score": 4.829715802551599}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8509417769196796, "4": 0.12711606655538446, "3": 0.018547445654060874, "1": 0.001925955636268495, "2": 0.001358520553034932}, "score": 4.823990255554182}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3214454895720375, "1": 0.2780292930942476, "2": 0.27798950994895777, "4": 0.08145370149253561, "5": 0.04094983901288769}, "score": 2.329216628035876}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9908887512850844, "4": 0.007817769463176819, "3": 0.0010558227058299796, "1": 9.133404027838333e-05, "2": 0}, "score": 4.989703742389837}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5805460806674206, "4": 0.2751348329053663, "3": 0.12071628967018112, "2": 0.013378999538299479, "1": 0.010087835368406675}, "score": 4.4028630598224625}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4324502881110935, "4": 0.19657123387620584, "3": 0.17502824816489604, "1": 0.12327230608507463, "2": 0.07247385520658242}, "score": 3.742604885028337}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9745823341440938, "4": 0.022351744662660687, "3": 0.0026189652027739053, "1": 0.00022235730231793998, "2": 0.00014379426431739096}, "score": 4.971087176645535}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"4": 0.41459815046542325, "5": 0.28327766894903317, "3": 0.20403374135821847, "2": 0.05507395283008251, "1": 0.042875200376610655}, "score": 3.8404478783164615}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8556103372281831, "4": 0.11425676942253327, "3": 0.02586667805992895, "2": 0.0022348025485210694, "1": 0.0019647760689042396}, "score": 4.8194343302411315}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7287561516360447, "4": 0.2015546940370523, "3": 0.06016815820943906, "2": 0.0052609639950674724, "1": 0.004208334564223978}, "score": 4.645474431195754}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9342932853812175, "4": 0.05907331378189985, "3": 0.0059618526433970085, "2": 0.0003316580797533013, "1": 0.000303345238527139}, "score": 4.9267919503589}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7739004896511145, "4": 0.19436409510036096, "3": 0.028214608591849464, "2": 0.002148279477996671, "1": 0.0013068330340181}, "score": 4.7375172735676765}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5710687350219296, "2": 0.24724552691197338, "3": 0.13209308705154227, "4": 0.032599810614418995, "5": 0.016785430516435117}, "score": 1.6765131704420588}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.2659916398046968, "2": 0.26016318766184793, "3": 0.2482494479067282, "4": 0.1604198240263121, "5": 0.06504781917179406}, "score": 2.4983047372526737}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3636236044705701, "5": 0.35488062984872837, "3": 0.2166199377379071, "2": 0.04262669409517101, "1": 0.022083792732923168}, "score": 3.9867537355695837}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4347093335384185, "4": 0.39768328771198397, "3": 0.13054656447012544, "2": 0.024682297319956917, "1": 0.012270286142918271}, "score": 4.218010911498603}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5775376349297805, "4": 0.2846791563666077, "3": 0.10253915021625103, "2": 0.020706077971451704, "1": 0.014444369418212697}, "score": 4.390289755968464}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3755332511627559, "4": 0.3349101473497719, "3": 0.2003886997168098, "2": 0.049360064137685504, "1": 0.039671457679346135}, "score": 3.9574042409248897}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7488430226553797, "4": 0.2005731421510597, "3": 0.04294618752142124, "2": 0.004340277468844353, "1": 0.003009181993838255}, "score": 4.68838711926607}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3400139271516919, "5": 0.23356048476988495, "4": 0.22610832056486216, "2": 0.11566228156081709, "1": 0.08457225679646105}, "score": 3.4084562861948275}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7053649997528455, "4": 0.20129835867420695, "3": 0.07274375634863742, "2": 0.011009864888834531, "1": 0.009424496206198093}, "score": 4.582420352687228}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6168085715644833, "4": 0.2554941923819613, "3": 0.1041460331348544, "2": 0.014205851809555935, "1": 0.009206235065203744}, "score": 4.456695663308871}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.44050613779616093, "2": 0.2378184289597777, "4": 0.20243338692690083, "1": 0.06693508565973791, "5": 0.052209698830599324}, "score": 2.9351578776455707}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3909231443821623, "2": 0.2768958323555298, "4": 0.20163763069708038, "1": 0.09969114723388985, "5": 0.030813329704880727}, "score": 2.7869778733940267}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3610911353561204, "3": 0.3292999965752202, "5": 0.17839918985822256, "2": 0.09382580070231233, "1": 0.037278355584330285}, "score": 3.549564994357048}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3494712783294694, "4": 0.3030646893667349, "2": 0.15984160865094468, "5": 0.09843104762963145, "1": 0.08909990595547838}, "score": 3.1619001730838954}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.36566904620454, "3": 0.3551141826338704, "2": 0.12149930942044893, "5": 0.09622979018166736, "1": 0.06142083310465436}, "score": 3.313808625421749}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.47979132940937047, "4": 0.3161268253084931, "3": 0.1318956762911123, "2": 0.03717132307754164, "1": 0.034624754664553385}, "score": 4.169744958992569}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.517930197325859, "4": 0.3242342274970992, "3": 0.13372698269707925, "2": 0.016508474893982095, "1": 0.007358528487458485}, "score": 4.329190208144068}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3396379437750493, "3": 0.32786684938950245, "1": 0.19515077774367814, "4": 0.10227916422844473, "5": 0.03485984797204604}, "score": 2.4419447269307755}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5529467362005641, "4": 0.3308068197877219, "3": 0.09264156240136139, "2": 0.015714610410062144, "1": 0.007713062182690169}, "score": 4.405808679388415}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4903740067231116, "4": 0.328950366927525, "3": 0.1305134229049062, "2": 0.030890110340872433, "1": 0.019085442639433656}, "score": 4.2408689935276005}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.34172853992827523, "4": 0.336045100616974, "3": 0.218356135513892, "2": 0.0664964976250354, "1": 0.03724939410225991}, "score": 3.8786161349328983}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7691209189731875, "4": 0.18657938007952435, "3": 0.03586881585894499, "2": 0.004913655073302024, "1": 0.0034461603835922406}, "score": 4.713136994200212}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8460132140952208, "4": 0.116158144696337, "3": 0.033822263834770404, "2": 0.0028042251977493334, "1": 0.0011461900921142377}, "score": 4.8031888777118965}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5177894948065483, "4": 0.2984733887618847, "3": 0.12818121167922522, "2": 0.033164309379383916, "1": 0.022323594735031618}, "score": 4.2563263105160924}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8222103881666194, "4": 0.150852189358818, "3": 0.02366840127464251, "2": 0.001966873603805629, "1": 0.0012552603220252723}, "score": 4.790879540904095}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"5": 0.412688668331252, "4": 0.34104549301358467, "3": 0.14400726921795498, "1": 0.05577777982072969, "2": 0.046292584162262757}, "score": 4.008764540860975}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.564000748701517, "4": 0.28712480417302844, "3": 0.1125265820904703, "2": 0.02028297732778656, "1": 0.01594783014614089}, "score": 4.363107225963323}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8058591529070858, "4": 0.16209454546575852, "3": 0.027633742461927298, "2": 0.0024276649731621164, "1": 0.0018815764806361462}, "score": 4.767804678879172}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6456826821383507, "4": 0.27892083024268755, "3": 0.05944675149376257, "2": 0.008142329178768911, "1": 0.007734482506804875}, "score": 4.546787698953176}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7975341770550142, "4": 0.17260160524490759, "3": 0.023741198658126354, "1": 0.0033111530393375244, "2": 0.0027300880979352266}, "score": 4.7584613684644985}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"1": 0.768802376615144, "2": 0.16229597573400842, "3": 0.0546155138578377, "4": 0.011097382603010351, "5": 0.0031339831862864996}, "score": 1.3173724658602495}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.4292338387002988, "2": 0.3383268293348409, "3": 0.17565393465154683, "4": 0.047353146954795984, "5": 0.009286084404407199}, "score": 1.8689654902899284}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.37619731473732443, "3": 0.36209813961121623, "5": 0.11127415031627043, "2": 0.09633116388657138, "1": 0.05403657212942621}, "score": 3.3943660179306367}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4262184801418101, "4": 0.38683628950010995, "3": 0.14648020193979355, "2": 0.022755411357538568, "1": 0.017553059741876337}, "score": 4.181596706554804}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.42620871985037057, "3": 0.2760289299772326, "5": 0.15493156123343824, "2": 0.0835681426747816, "1": 0.05916438635241764}, "score": 3.5342274200767867}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.24759124456611695, "1": 0.24228474797603852, "2": 0.20261533480046293, "4": 0.1909034072614148, "5": 0.11647142675081538}, "score": 2.7366261804153247}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5531174572074609, "4": 0.24999479033425462, "3": 0.1348728629770229, "2": 0.03240735097413229, "1": 0.029420743270645124}, "score": 4.265217203780537}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5764251632086864, "4": 0.22610364017106868, "3": 0.129435874252731, "1": 0.034037201185495296, "2": 0.033765490134789154}, "score": 4.277411239597072}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7707691859141764, "4": 0.18309643458365038, "3": 0.03706542813559724, "2": 0.005257636961695803, "1": 0.0036768407035405104}, "score": 4.7122537411414305}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.37204106165778705, "5": 0.32570542838940997, "3": 0.1902832932840068, "2": 0.06485161920926083, "1": 0.04696762708590523}, "score": 3.864795603570921}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.47023777873798006, "4": 0.33381631245499277, "3": 0.12332785276991727, "1": 0.03629980171946289, "2": 0.03602246526557995}, "score": 4.166014695607958}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3784636831930012, "2": 0.2210285279607477, "4": 0.1993834946411614, "1": 0.11423976928008513, "5": 0.08677107067697126}, "score": 2.923408879886247}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.303496925100041, "4": 0.2834725176555109, "5": 0.19884083468348837, "2": 0.11925530068653692, "1": 0.09486324033375425}, "score": 3.372198899359534}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7403057370015719, "4": 0.22368400836735391, "3": 0.03143319433578123, "2": 0.002522953600749132, "1": 0.0019757385522989734}, "score": 4.697954117174931}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4027740275432628, "5": 0.36339880914744327, "3": 0.16829972698150034, "2": 0.037264281934533953, "1": 0.0281381041959699}, "score": 4.036160727615088}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8403081240999766, "2": 0.11625956015541251, "3": 0.031148396867525182, "4": 0.008152232197225918, "5": 0.004062725196004417}, "score": 1.2192790730764163}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8919625746078431, "4": 0.08761811589203267, "3": 0.016537666195120426, "1": 0.002237856703416554, "2": 0.001551478394079106}, "score": 4.865688291648778}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.32853743176984673, "4": 0.3220103149321592, "3": 0.2219661247431852, "1": 0.06821287151833207, "2": 0.05911004516867899}, "score": 3.7836772957016906}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4366434154210913, "4": 0.2495166581218191, "3": 0.17221649530942623, "1": 0.08211613936934588, "2": 0.05930509248627287}, "score": 3.8994479854849327}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.48853625170846554, "4": 0.2927947287383, "3": 0.15086908575020644, "1": 0.03521962582168145, "2": 0.032487950897613485}, "score": 4.1670478147470025}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"1": 0.43399207735098644, "2": 0.21943116384540287, "3": 0.17313959540597007, "4": 0.10393919648473322, "5": 0.06936757775183716}, "score": 2.1551488740114846}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.36318766312454465, "2": 0.24480426649578174, "3": 0.21336249613636485, "4": 0.11938479872377084, "5": 0.059048378293073224}, "score": 2.266146094030788}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.28045311947049295, "3": 0.2683744156900752, "2": 0.24945680625505418, "4": 0.12142977097308556, "5": 0.08023890355424668}, "score": 2.4715197027371048}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.2464879428704868, "4": 0.24498198542949334, "3": 0.22659248389062706, "1": 0.15710189050887513, "2": 0.12476376621722418}, "score": 3.2990118321804993}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3670040850731523, "2": 0.25550594538512783, "3": 0.22045786296965622, "4": 0.11187208036765668, "5": 0.045059411699490855}, "score": 2.212397544004025}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3519207045240187, "4": 0.22404882099598625, "2": 0.16696738250216644, "1": 0.13236857666698965, "5": 0.12450421602451651}, "score": 3.0413605880992707}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8926936536368806, "4": 0.09163360571190146, "3": 0.014362652757594165, "2": 0.000704063504935674, "1": 0.0005394628153085774}, "score": 4.875362750945469}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5568518237663816, "4": 0.21024938609803526, "3": 0.17022130404906521, "2": 0.03496118614981214, "1": 0.0275219145206276}, "score": 4.234187926573356}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7855770780519522, "4": 0.18607380181783917, "3": 0.025577301013225476, "2": 0.001627770975073088, "1": 0.001113962946165683}, "score": 4.7534250131890845}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.542264580905486, "4": 0.2951955384564333, "3": 0.1175690215985805, "2": 0.02428275867526902, "1": 0.02054763355798448}, "score": 4.314531322492749}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9511933792958548, "2": 0.03908813932812473, "3": 0.0069705649707379625, "5": 0.0013920799268558744, "4": 0.0012652785290142609}, "score": 1.062399075296371}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.31424224802319206, "5": 0.2214553477749037, "3": 0.17177067099216484, "4": 0.16025208056831874, "2": 0.13213845560697085}, "score": 2.8425175884152774}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4633965092134694, "2": 0.24306779081510377, "3": 0.16169245079115918, "4": 0.08844836000859162, "5": 0.043345798537619724}, "score": 2.0052303139671612}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7338667546655209, "4": 0.1666535453878735, "3": 0.05473171164327864, "1": 0.03005486602986594, "2": 0.014473831270881397}, "score": 4.560145617284887}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.38342106778410023, "4": 0.27683813327651974, "3": 0.17754446400505203, "1": 0.08859441140974177, "2": 0.07353257306369174}, "score": 3.793013868838845}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.327651052903863, "5": 0.2836843791044413, "3": 0.22468694526225, "1": 0.08541291159317317, "2": 0.07844390465636061}, "score": 3.64582810348985}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.797802089848478, "4": 0.1630560454756398, "3": 0.033746337029936374, "1": 0.002704639898350682, "2": 0.002660626919327296}, "score": 4.750643294372656}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4304246928142239, "4": 0.22832491469879931, "2": 0.15270034613427022, "1": 0.10551413014614097, "5": 0.08294040011711913}, "score": 3.0304800198387865}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7117986802571461, "4": 0.22260263563092125, "3": 0.054060153429732874, "1": 0.0059505513491198165, "2": 0.005516950593786123}, "score": 4.628897641399095}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4760522175652854, "4": 0.27801794973049554, "3": 0.14947851632342157, "1": 0.05945776799746192, "2": 0.03688578619909171}, "score": 4.074436846328443}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"5": 0.49555293471992373, "4": 0.19528366210014797, "3": 0.13184801780610764, "1": 0.12517381344252398, "2": 0.0520744163380838}, "score": 3.8840268556647715}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.32424171739426233, "5": 0.2648398434598735, "3": 0.2501052874446418, "2": 0.08790311824548785, "1": 0.0728089494011832}, "score": 3.6204631061926285}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5371314116386854, "4": 0.2742138232787713, "3": 0.1480895826730053, "2": 0.020339194315234805, "1": 0.02013416209294103}, "score": 4.287987398787661}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4110916321768544, "4": 0.35824602784413, "3": 0.16438655203164731, "2": 0.03685653262274964, "1": 0.029385544771141137}, "score": 4.084838240530328}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.49400357251925986, "4": 0.34568535371152953, "3": 0.13023770476526744, "2": 0.015733528035462185, "1": 0.014290281330576037}, "score": 4.289442312347534}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"4": 0.35728042548153593, "5": 0.3447170304825226, "3": 0.1922650481110594, "2": 0.06059126125609638, "1": 0.044839994654093815}, "score": 3.8967178467688663}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5647924276659555, "4": 0.3353076199500709, "3": 0.08077399575260427, "2": 0.010445012366611653, "1": 0.008605463385863241}, "score": 4.4373450282096485}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.432107836655783, "5": 0.4060051803414931, "3": 0.1365074345872054, "2": 0.015099736283237896, "1": 0.010148178984341678}, "score": 4.20888123192889}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8048045870806582, "4": 0.16186419464242577, "3": 0.02788111781775225, "1": 0.0027293685415543077, "2": 0.0026955592021121887}, "score": 4.763363461165248}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6066272998754898, "4": 0.2940482527824893, "3": 0.07769479595326448, "2": 0.0116032563550668, "1": 0.009970440633970491}, "score": 4.475841294724189}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3963272817498023, "2": 0.2525319256604898, "3": 0.20968000418667768, "4": 0.09187783176427872, "5": 0.04947690915307577}, "score": 2.1455545491186228}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8686777856411542, "4": 0.1024858847133747, "3": 0.022206316578766126, "1": 0.0037121602284420044, "2": 0.0028411297687923986}, "score": 4.829716387227495}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5284723991063229, "4": 0.2524582475947347, "3": 0.15141507080003466, "2": 0.035244950789425085, "1": 0.032283355214895046}, "score": 4.209743783869407}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9077268841570797, "4": 0.0787392908287494, "3": 0.011583515142583711, "1": 0.0011223139479660505, "2": 0.0007862424913087459}, "score": 4.8912411545652015}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8884834219773944, "4": 0.09062728067998388, "3": 0.016348551153993723, "1": 0.002559273115671117, "2": 0.001920210429980108}, "score": 4.860669357495997}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4026519249697972, "4": 0.19550351894500773, "5": 0.17945955801070426, "2": 0.11755268064030122, "1": 0.10476453194675729}, "score": 3.227356301890345}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.75454883340441, "4": 0.20749716542647337, "3": 0.03301354985905362, "2": 0.0025120018347056464, "1": 0.0023784744124533087}, "score": 4.7094113095134045}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4492459357967058, "4": 0.33388501892174893, "3": 0.1807055261405786, "2": 0.022640824691671457, "1": 0.013429810214584077}, "score": 4.182986326173901}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.945964095185414, "4": 0.0490690249338454, "3": 0.004335175002061939, "1": 0.00036737515915613974, "2": 0.00019635761399984213}, "score": 4.940197986714648}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9837223670970555, "4": 0.014286789212573038, "3": 0.0016466275364866224, "1": 0.00021851869203863452, "2": 8.748423082368634e-05}, "score": 4.981282713005816}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"4": 0.33234273773150846, "3": 0.3313471372967783, "2": 0.18177149549285743, "1": 0.11222822026560594, "5": 0.04221984955191411}, "score": 3.0105554567098523}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8389085896500383, "4": 0.14025452097261668, "3": 0.01804434391174034, "2": 0.0013775689000540695, "1": 0.0013337630112592745}, "score": 4.814173940863961}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6388255925278982, "4": 0.29432181542599006, "3": 0.05757341286770659, "2": 0.005290067358590946, "1": 0.003925482521066986}, "score": 4.55893116177768}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8068738763315124, "4": 0.169278075350191, "3": 0.0216354631087364, "2": 0.0012575063579239754, "1": 0.0008994314648250977}, "score": 4.780068514886839}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6809590069628622, "4": 0.2510522987502064, "3": 0.05733338440799892, "2": 0.00597872825514504, "1": 0.00459989408845989}, "score": 4.597914336355985}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27027819461621727, "4": 0.2554290496689528, "2": 0.18170556075557717, "1": 0.15435806160756219, "5": 0.13793300261632885}, "score": 3.0408854783776866}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6016413953221728, "4": 0.3207884844458089, "3": 0.0685073801569448, "2": 0.005830555500816315, "1": 0.0031290078672401704}, "score": 4.5121387213486805}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7746513669019901, "4": 0.19002086444162172, "3": 0.03153397950816802, "2": 0.0023529909862317175, "1": 0.0013566240248557159}, "score": 4.734403351115178}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9523153357552103, "4": 0.04201663364226526, "3": 0.0048008658112047705, "1": 0.00042780289250075014, "2": 0.0003773165755281269}, "score": 4.945535094146046}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7133661756951887, "4": 0.2424256048005904, "3": 0.03616217123663074, "2": 0.004413161292337325, "1": 0.0035397771705144737}, "score": 4.657819599816831}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.33049144666835784, "3": 0.2798485262143692, "2": 0.2598741769262325, "4": 0.08829371073615776, "5": 0.04113242660748842}, "score": 2.2494315045575264}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.2492915709237402, "3": 0.2474827491021414, "4": 0.23872653193806337, "2": 0.14915948147174476, "5": 0.11526658533465714}, "score": 2.821504034583511}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4164673549162077, "2": 0.20521255158252838, "4": 0.1845223656155392, "1": 0.14110415124047204, "5": 0.05253282850232278}, "score": 2.802135362183632}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.297975652152781, "4": 0.27382767330418184, "2": 0.15626682752569404, "1": 0.14355394371935395, "5": 0.12826754514995026}, "score": 3.0869974755250125}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.5608779472297478, "2": 0.27694282556554156, "3": 0.11658544981857923, "4": 0.03915385867889538, "5": 0.006363434701484509}, "score": 1.6530789901425627}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.26380652614949973, "1": 0.21324620260796773, "3": 0.20987367014899597, "4": 0.2091475908346709, "2": 0.10368713823820704}, "score": 3.2066304579145393}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4578767664316586, "4": 0.24921691927789055, "3": 0.13863684369873736, "1": 0.10609705400062981, "2": 0.04794964409976728}, "score": 3.9050283154527263}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.398596401137939, "3": 0.19988169748933377, "2": 0.1485499520292792, "4": 0.13457381770125676, "5": 0.11818047190131761}, "score": 2.425066867402074}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5000743608089544, "4": 0.21118902361932582, "3": 0.12847871890451498, "1": 0.1164029733228853, "2": 0.04363446322153967}, "score": 3.9351034883997893}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.42165337024567984, "3": 0.18418212520798558, "2": 0.17526376696578003, "4": 0.13480476937630076, "5": 0.0837799718049557}, "score": 2.2835678155384413}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4111503978146378, "3": 0.3025267426391778, "5": 0.19298994304694533, "2": 0.06292735582777909, "1": 0.030329671142135223}, "score": 3.6735947045815656}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4764802046417681, "5": 0.42505394019723547, "3": 0.08648037235351604, "2": 0.008320857205075497, "1": 0.0036027404031723476}, "score": 4.311142887363627}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3845642514867527, "3": 0.34498756709704825, "5": 0.1473375155337123, "2": 0.08601533368148678, "1": 0.03700271095381239}, "score": 3.519266622087226}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5620772404551277, "4": 0.36674257777358604, "3": 0.061853703697772, "2": 0.006371508654490403, "1": 0.0029021434335019863}, "score": 4.4787993821971}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6203944646172133, "4": 0.270393087261887, "3": 0.07899384033484252, "2": 0.01718387903633301, "1": 0.012865982064722668}, "score": 4.4685139801965725}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.2818346013921753, "2": 0.2777786237407505, "3": 0.23845880713166948, "4": 0.15171479035257804, "5": 0.05003194387746858}, "score": 2.410223964404107}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.39369766970937015, "4": 0.21603691135381764, "2": 0.20224925633692234, "1": 0.13028264452507426, "5": 0.05757235928389144}, "score": 2.868345867313685}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3730834342632722, "3": 0.326318461069644, "5": 0.159681719191038, "2": 0.09381206561052274, "1": 0.046932320707198855}, "score": 3.5048570005996047}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.355541748723381, "4": 0.3485392951655726, "3": 0.1944599596691219, "2": 0.054186948614722404, "1": 0.04704872557159304}, "score": 3.911541960461119}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2892059543126205, "4": 0.2306674537101905, "2": 0.21335287370477654, "1": 0.18062559969684697, "5": 0.08605630393762968}, "score": 2.828160211078977}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"2": 0.366808817464396, "1": 0.28707967170131765, "3": 0.26891847828856486, "4": 0.061453038345624024, "5": 0.01566416436625291}, "score": 2.1517488834698737}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.377143510316039, "5": 0.37481430961913664, "3": 0.1614745877651211, "2": 0.04779948087018895, "1": 0.0385572549819975}, "score": 4.002069431520623}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.44579717275890346, "4": 0.3577513453377097, "3": 0.16497911316056857, "2": 0.02141292215870577, "1": 0.010011328271525968}, "score": 4.207968237547008}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2993886550497332, "3": 0.291116514056318, "2": 0.16104879264567948, "5": 0.15701024829497925, "1": 0.09134600774128353}, "score": 3.2696925571057838}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6353954487393267, "4": 0.3229721443115258, "3": 0.038553222104049586, "2": 0.002148453495682009, "1": 0.000922487253028817}, "score": 4.589782720110418}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"1": 0.32568849214747986, "2": 0.203431589530576, "3": 0.19716137956192684, "4": 0.17140822273831602, "5": 0.10190898173479103}, "score": 2.5202250622498434}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4183654274596771, "5": 0.33086024940344294, "3": 0.20407671538915517, "2": 0.030247044553168973, "1": 0.01613744872816776}, "score": 4.017882698054906}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3314339947636376, "3": 0.3047936770412926, "5": 0.21396579782094435, "2": 0.09518843744221925, "1": 0.05424077213087959}, "score": 3.555905363358545}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5331461978639017, "4": 0.341298130728731, "3": 0.09619672168592847, "2": 0.016463376024420703, "1": 0.012442126074047528}, "score": 4.3668626989257735}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4228034141178883, "4": 0.37615459243432164, "3": 0.1534297916460407, "2": 0.028449297817424255, "1": 0.01874085460418643}, "score": 4.1563184371239315}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4315176351002666, "2": 0.30165261655221537, "3": 0.1896542881956567, "4": 0.05405580176253873, "5": 0.02298232584447727}, "score": 1.9351863331280872}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3845671357294547, "4": 0.2814556760796777, "3": 0.20445914569701218, "1": 0.0687810849427649, "2": 0.06067397626177931}, "score": 3.852407487113835}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.28969106990535864, "4": 0.2752487347830733, "3": 0.2668448701788601, "2": 0.09398077865642149, "1": 0.07398998002600839}, "score": 3.6128200111001267}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7033887660476914, "4": 0.16075742937187973, "3": 0.07713416274409299, "1": 0.03899125066281575, "2": 0.019657520327803796}, "score": 4.4699991198946565}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.34610911235872033, "4": 0.2968763074977448, "3": 0.21113285480982596, "1": 0.07294161881926456, "2": 0.07284291541544272}, "score": 3.770443259388313}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8299531712200342, "2": 0.1188457791381118, "3": 0.03478330321539847, "4": 0.00949699163999707, "5": 0.006539017854129578}, "score": 1.243152252100224}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.26395102616371224, "5": 0.2634425398146346, "3": 0.23356950037859722, "1": 0.12247920726701962, "2": 0.1162366825252066}, "score": 3.42977898663461}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32200355278654835, "2": 0.2998342071267943, "1": 0.18670114418221972, "4": 0.12667117797144434, "5": 0.06456786743945361}, "score": 2.5824777063277438}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6440990566706978, "4": 0.2753189596921228, "3": 0.06327536525921555, "2": 0.009315636002671044, "1": 0.007743759389974893}, "score": 4.539094417767544}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.28342574854865515, "5": 0.26734997796699134, "3": 0.23258668144889655, "2": 0.11216137460727069, "1": 0.10409878238702339}, "score": 3.497954710658034}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3102171943164755, "4": 0.2389558194491199, "5": 0.23111455090735655, "2": 0.12327636181066114, "1": 0.0962985998253261}, "score": 3.3853643372603663}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.2572948179515633, "3": 0.23063230266882248, "4": 0.20179860174528264, "1": 0.18240375772347062, "2": 0.12775946022477083}, "score": 3.2238461222567674}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.5263954724378209, "2": 0.28593982282623204, "3": 0.11577521147658197, "4": 0.05405068832556139, "5": 0.017727797342059603}, "score": 1.7506368265107037}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7577788731318348, "4": 0.17445759072003486, "3": 0.052771352594996344, "2": 0.007814478874950242, "1": 0.007012847184379075}, "score": 4.668450220261846}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6258420224711363, "4": 0.23687549818310147, "3": 0.09638434372954817, "2": 0.021175777950842363, "1": 0.019618864522315618}, "score": 4.4282938547501365}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"1": 0.436345843948721, "2": 0.3474329785710646, "3": 0.18088610498615118, "4": 0.029810151175602526, "5": 0.005462787982727292}, "score": 1.8205377767502484}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6436243503354425, "4": 0.23464876497969245, "3": 0.09933227853265472, "1": 0.011567729468891735, "2": 0.010771660730783991}, "score": 4.488072511323164}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6743437724195008, "4": 0.21643539122064287, "3": 0.09002377291784695, "2": 0.010272369100489936, "1": 0.008868656143011343}, "score": 4.537199396558062}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.49289219512377397, "4": 0.317413702736209, "3": 0.13440835333961207, "1": 0.030070979756150806, "2": 0.025142790086928924}, "score": 4.218001013827523}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3142483758067742, "3": 0.25959153565990595, "5": 0.19758628578480203, "1": 0.13085787086499667, "2": 0.09759222018104369}, "score": 3.35015630389783}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2857234197161045, "3": 0.23702399458429993, "5": 0.20059643004469951, "1": 0.14326604824910186, "2": 0.13315967592561503}, "score": 3.2672860985129963}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3754439261828178, "4": 0.27776479070973353, "3": 0.2090473286046563, "1": 0.07637752511306936, "2": 0.06124570833574584}, "score": 3.8147502420214288}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.43293654892364736, "2": 0.28200586792946447, "3": 0.1937312673631938, "4": 0.06018422525253579, "5": 0.031078314063970505}, "score": 1.9743964782343637}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.32089731435624225, "5": 0.2822940558754971, "3": 0.20760459375935222, "1": 0.10958894240755732, "2": 0.07948327156733696}, "score": 3.586901636292247}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.516304743319729, "4": 0.33363569994484576, "3": 0.10656175529102929, "2": 0.022026068396108885, "1": 0.021271251771440586}, "score": 4.301937628763502}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.43001774659284847, "3": 0.23861070605953646, "4": 0.2038580012118065, "1": 0.07039717813015363, "2": 0.05693656645823732}, "score": 3.866318337056518}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.30664201092406623, "3": 0.30293833773741463, "2": 0.24545471722077242, "4": 0.09732221513223177, "5": 0.04747550429560119}, "score": 2.333423023192049}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4510706724919093, "4": 0.31108341105924153, "3": 0.18328052066932604, "2": 0.0288475936072734, "1": 0.02563234111539129}, "score": 4.133209325471601}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.33028132093534274, "4": 0.3272026419064257, "3": 0.22207391546082741, "1": 0.06579484415683384, "2": 0.05454438527762767}, "score": 3.801713700322674}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.34008040637258213, "2": 0.23914868679647752, "3": 0.22374597741998925, "4": 0.13864036511928915, "5": 0.05823352262168704}, "score": 2.3356975734731504}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5876159445557112, "2": 0.2669202645036326, "3": 0.10798426034769547, "5": 0.019117517837513198, "4": 0.0182173835617605}, "score": 1.614099823996746}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.312487065831951, "3": 0.2990657889085422, "5": 0.2684185400709394, "2": 0.08835292268546299, "1": 0.03159925293393191}, "score": 3.6978260519650124}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.356540015494666, "4": 0.20791519474340797, "5": 0.18696145619065785, "2": 0.15774091032210572, "1": 0.09077168329475352}, "score": 3.2425709896738613}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6805507038279331, "4": 0.23223172294338176, "3": 0.07188168323846823, "2": 0.009662590490399036, "1": 0.0056239405235550015}, "score": 4.572500276065538}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4756575435499757, "4": 0.2970605169979556, "3": 0.16582006902989616, "2": 0.03510803701270806, "1": 0.026259821698027933}, "score": 4.160857057847884}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"5": 0.39731003439971196, "4": 0.35001148876309257, "3": 0.16214762390841095, "2": 0.04671231708217424, "1": 0.04368249190786482}, "score": 4.010691755151841}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9384653446086703, "4": 0.050190831921969305, "3": 0.010158702009130579, "2": 0.0006114439297556347, "1": 0.0005100451534441488}, "score": 4.925612518204439}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7228222338608231, "4": 0.1967263504354155, "3": 0.05655969216703215, "1": 0.012782771388267765, "2": 0.01092420073439357}, "score": 4.606177818269302}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8965909329638778, "4": 0.05849356095193953, "3": 0.035253110940033826, "1": 0.005154716284408329, "2": 0.004424926105427933}, "score": 4.837093092718802}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8145391058494071, "4": 0.15290380206587567, "3": 0.025893575273152412, "1": 0.003853407720362507, "2": 0.0027437930254673934}, "score": 4.771648894083016}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3210474973421992, "1": 0.26094406629741773, "2": 0.21635911119038279, "4": 0.14385077520752065, "5": 0.05769562682124202}, "score": 2.5209454792686885}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.35134813832212214, "1": 0.3055245021957132, "3": 0.2640817934888258, "4": 0.06509075839390364, "5": 0.013895996526602597}, "score": 2.130434468651764}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3301025880347441, "4": 0.22422380420634638, "2": 0.21559196688229493, "1": 0.1668359974985829, "5": 0.06316145835563733}, "score": 2.801266028614329}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.304137858031587, "3": 0.30142760733112517, "4": 0.27410870985045804, "2": 0.0734409350932307, "1": 0.04683333702738038}, "score": 3.715313693093702}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3962493358026004, "2": 0.24939799127469792, "3": 0.21974858095068478, "4": 0.08527784402644249, "5": 0.049119778721934855}, "score": 2.141443473090852}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.43857418607874843, "4": 0.23710438304995748, "3": 0.17252788558678706, "1": 0.08880009137382734, "2": 0.06286884173070487}, "score": 3.8738926283945823}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3050807144024316, "4": 0.2672329043176427, "3": 0.20809262206651927, "1": 0.11653072579735863, "2": 0.1027409610286001}, "score": 3.5417664084998135}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.37904118964606953, "4": 0.2726977336353308, "3": 0.24366915400444264, "2": 0.07031606399071763, "1": 0.03417792196342418}, "score": 3.8921955837546767}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7339957651020511, "4": 0.19634681875484797, "3": 0.05357441269384439, "2": 0.008721447998264345, "1": 0.007262276004744215}, "score": 4.641255291867726}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.44943173740299247, "4": 0.34655480689605483, "3": 0.14286036418707787, "2": 0.03498133659005598, "1": 0.02601239041639359}, "score": 4.15859680348809}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7913181181026172, "2": 0.1491751142045439, "3": 0.04245307630270462, "4": 0.01147571747426179, "5": 0.005515799877916099}, "score": 1.2905896858785624}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4082759847683796, "4": 0.3937045437306933, "3": 0.14733118015675592, "2": 0.030146995877313797, "1": 0.020386731630705774}, "score": 4.139512181502842}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2620191988113025, "1": 0.2322291451855637, "4": 0.1926867433823713, "2": 0.18108149507768778, "5": 0.13186995914173905}, "score": 2.8108654173096443}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.45135238640116787, "4": 0.27384938869967884, "3": 0.17298103755510205, "1": 0.05316077854118873, "2": 0.04849890299278357}, "score": 4.021894655772426}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.527239349458933, "2": 0.23028767286733645, "3": 0.1570859926020033, "4": 0.056467371681811325, "5": 0.02883454879099243}, "score": 1.8292705098440656}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3769240012696168, "2": 0.2793453078189614, "3": 0.20675172535214512, "4": 0.09807644042697318, "5": 0.03878974001207012}, "score": 2.1423658817257722}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5648737636315884, "4": 0.3078889847825541, "3": 0.106942764377147, "2": 0.013467761317953814, "1": 0.006683538607701789}, "score": 4.411003711300175}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.33381467675906923, "4": 0.3294093752654091, "3": 0.23774668996213252, "2": 0.06164112608248879, "1": 0.03726989435799818}, "score": 3.860959611759923}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4433627922313135, "4": 0.2865460565215623, "3": 0.16485741997718917, "1": 0.054690361043978515, "2": 0.05040570579975593}, "score": 4.0136247531665035}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8346351464342995, "4": 0.13354684016774648, "3": 0.02627517242287317, "2": 0.003176082690133299, "1": 0.0022807193075577866}, "score": 4.795234071834813}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"4": 0.27211342389291704, "3": 0.24518356600115498, "5": 0.21201956941690325, "1": 0.14178394416962586, "2": 0.12882221544781264}, "score": 3.283784390101425}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3188582284196918, "5": 0.22122205680428772, "3": 0.20481990462248525, "1": 0.15312296309627946, "2": 0.10153389452882622}, "score": 3.3536791843958627}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.86460024792288, "4": 0.09439520515219256, "3": 0.034758125742144486, "1": 0.0033946405495431727, "2": 0.0027992017268572314}, "score": 4.814102601702872}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8804816338824437, "4": 0.08912152421485202, "3": 0.023734015658255097, "1": 0.004125729608698509, "2": 0.0024655740950592386}, "score": 4.83949932433256}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2611680001489853, "3": 0.22040758226584511, "1": 0.1868738292013668, "5": 0.17302233305718853, "2": 0.15841183285887636}, "score": 3.075061913895001}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"3": 0.35815321832230834, "4": 0.2257982449236136, "5": 0.1966515692937758, "2": 0.12004869822265875, "1": 0.09924785219516258}, "score": 3.3005871649722955}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7534794379554557, "4": 0.2146580890898929, "3": 0.028506310362169822, "2": 0.0019549786623565438, "1": 0.0013649902407561051}, "score": 4.716994150209858}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8975521845182411, "4": 0.08839719858991639, "3": 0.012618762314683585, "2": 0.0007582999031327807, "1": 0.0006336353035687308}, "score": 4.881551107451821}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7981139797219835, "4": 0.17437556260554224, "3": 0.023975279507277198, "2": 0.0017718898325130349, "1": 0.0017067778230950297}, "score": 4.7655178468840225}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4180548855222436, "5": 0.25114397467890254, "3": 0.21091161911685768, "2": 0.07117348013232654, "1": 0.04863061539545987}, "score": 3.751972361311729}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3570638363079983, "2": 0.28455449419912676, "3": 0.21640623933686887, "4": 0.09986916496316584, "5": 0.04195154572106797}, "score": 2.1849639876488722}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3385795523206896, "4": 0.2830222393926977, "2": 0.1873480054342636, "1": 0.09924388236047196, "5": 0.09174323754458064}, "score": 3.0806780337348014}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4814020477033609, "4": 0.3544000922330412, "3": 0.1233617479208389, "2": 0.02580333840197613, "1": 0.014892980267955786}, "score": 4.261791278886734}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5718035446528935, "4": 0.30145268715136114, "3": 0.10011219218780673, "2": 0.017295545433976548, "1": 0.009286270127952516}, "score": 4.409261816263788}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3876908094110819, "5": 0.29235089586715235, "3": 0.21791787660243925, "2": 0.06787758613618208, "1": 0.03410620317316494}, "score": 3.836349970166412}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3004010991932951, "3": 0.28715638963865625, "2": 0.16714641736468938, "5": 0.13208002369122665, "1": 0.11313532617759545}, "score": 3.1711578968178844}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.46190732650600685, "4": 0.3412692581281995, "3": 0.16277218399394183, "2": 0.02227038522339714, "1": 0.011664883041565838}, "score": 4.219625191360114}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.25834202337285733, "4": 0.22500609235746663, "2": 0.22058338330495703, "1": 0.20786137246708317, "5": 0.08802530051267134}, "score": 2.7647077824338884}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.50137427545946, "4": 0.383674965055258, "3": 0.09671225039566571, "2": 0.012507565221803487, "1": 0.005606215421637757}, "score": 4.362873509004211}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.45020240880582335, "5": 0.276093832007605, "3": 0.21493188822486067, "2": 0.038523262476002164, "1": 0.020103702035614075}, "score": 3.9237932698771627}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.544471706668782, "4": 0.22858443918389504, "3": 0.15773837071389343, "2": 0.03931094500600507, "1": 0.02977459993806919}, "score": 4.218813890336128}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.33593623964080455, "3": 0.2634611922067404, "5": 0.25324494413032766, "2": 0.08939298208962636, "1": 0.05780358968242435}, "score": 3.637528641869246}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3521569225590422, "5": 0.2863321438114997, "3": 0.27316843391494455, "2": 0.060791323851710204, "1": 0.027422023803613648}, "score": 3.8092903602396118}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9373330237506416, "4": 0.05434557964506712, "3": 0.007134096252901471, "2": 0.0005851936148113069, "1": 0.0004905318241616673}, "score": 4.927660448428918}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7358585692968936, "4": 0.1956656194266699, "3": 0.052992472702371715, "2": 0.008581024216964704, "1": 0.0068024189643876775}, "score": 4.645361259883926}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"1": 0.36851381803355504, "2": 0.287995218907389, "3": 0.265976851080654, "4": 0.056372603051313336, "5": 0.020962335483440852}, "score": 2.0731083446739227}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.24717121607606182, "4": 0.22216756156279688, "2": 0.19296730665427633, "1": 0.18679789910721953, "5": 0.15071654375181276}, "score": 2.9570298322193236}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4171467919761809, "4": 0.20750469771028843, "2": 0.2064864677923975, "1": 0.10062079831409308, "5": 0.06819755262776485}, "score": 2.936168949665838}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6787413037301565, "4": 0.24732831857293422, "3": 0.05926466612863959, "2": 0.008572824677817484, "1": 0.005962407121475674}, "score": 4.5845200349205735}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2598569478394529, "4": 0.21117198135278445, "1": 0.1970138397842157, "2": 0.19159846978224482, "5": 0.14021494673098633}, "score": 2.905962201464133}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8163902914668464, "2": 0.14226785434543296, "3": 0.03112159275214889, "4": 0.006376495035879589, "5": 0.0037150304661430437}, "score": 1.2385313543785283}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.428655432683389, "2": 0.230573245298728, "3": 0.19885529093764834, "4": 0.10552789008584063, "5": 0.03625480698464315}, "score": 2.0900320637159315}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.3276197637223929, "3": 0.2882787168472132, "2": 0.23413303489063297, "4": 0.10018785552723215, "5": 0.04968795645967358}, "score": 2.3101272738444822}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2488980510232089, "3": 0.23525943383569103, "1": 0.19972301446655694, "5": 0.1970452265887859, "2": 0.11898855106938556}, "score": 3.1245646022517195}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4565947696251067, "4": 0.3175724175136603, "3": 0.1456017098228061, "1": 0.044763003297052135, "2": 0.0353630673023097}, "score": 4.105989047594707}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"3": 0.36035302609207737, "4": 0.2321184215103836, "2": 0.16132837417351023, "5": 0.13888236487850966, "1": 0.10716634773620196}, "score": 3.134242414730632}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4737831269830297, "4": 0.32607045543498153, "3": 0.1450653860395277, "2": 0.028827188270296532, "1": 0.026178008262108192}, "score": 4.192543941188301}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3060773289403175, "4": 0.2946510806892608, "5": 0.24468421944701113, "2": 0.09154540502504784, "1": 0.06292190026253097}, "score": 3.566698355031495}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.48283446820585346, "4": 0.34623840825669217, "3": 0.11831870565485712, "2": 0.026341772285070203, "1": 0.026121080726227586}, "score": 4.233502965631312}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.39111233440149884, "4": 0.3521966833200518, "3": 0.17261777877303697, "2": 0.04786168453422609, "1": 0.036069371812755734}, "score": 4.01456514151522}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3407206996239835, "4": 0.28718496312093245, "2": 0.1843239078972267, "1": 0.10273623505309104, "5": 0.08491164786188611}, "score": 3.0672201184276986}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.45767090554108475, "3": 0.2705405998747126, "5": 0.22414063260427203, "2": 0.03391765512559591, "1": 0.013545814125629224}, "score": 3.8450987174313065}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3343923415825176, "3": 0.32933618863356107, "5": 0.18698129385352907, "2": 0.1038021287782149, "1": 0.04525896078696637}, "score": 3.5141526643024563}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5099952841863234, "4": 0.39848532779973045, "3": 0.07794806557614045, "2": 0.00967292628990949, "1": 0.0038319659676744615}, "score": 4.401232122049519}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.2998086923214382, "2": 0.2903324886961736, "3": 0.24198803407960195, "4": 0.12054176362487107, "5": 0.047240325373847085}, "score": 2.325012672422261}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3486993462929081, "5": 0.30500189173015785, "3": 0.2368959414207077, "2": 0.06789021254142268, "1": 0.041434330609769796}, "score": 3.808007504722979}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6834477708518213, "4": 0.21366504509870618, "3": 0.07987933463708076, "2": 0.0124617503245878, "1": 0.010459255487309863}, "score": 4.547314699882776}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.38389158384310446, "4": 0.29313310202294807, "3": 0.25206398877337804, "2": 0.04948830004860457, "1": 0.02135349184973476}, "score": 3.968788349169169}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8918926778075236, "4": 0.08888998477568244, "3": 0.016991280130862093, "2": 0.0011308311337779714, "1": 0.0010305726091494947}, "score": 4.869604240576822}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6664832972949797, "4": 0.2469751635102479, "3": 0.07266244520920175, "2": 0.008205070189481092, "1": 0.005637967222399516}, "score": 4.560517020362867}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2998069834167624, "2": 0.2531233397892821, "4": 0.20631327766935081, "1": 0.18559388618243416, "5": 0.05510831316862037}, "score": 2.6922021092764643}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2941403042909198, "5": 0.2858255840994484, "4": 0.2038919871732597, "2": 0.1110016181331424, "1": 0.10498602845620991}, "score": 3.4546397120904873}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3177711847531447, "4": 0.29782854809872805, "5": 0.20547553566325089, "2": 0.10500768930812052, "1": 0.07373994736264723}, "score": 3.456372856658029}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7759181974598973, "4": 0.17614957269494821, "3": 0.0409978767583704, "2": 0.004251773878285155, "1": 0.002622676284326695}, "score": 4.718591789841475}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8328414009172976, "4": 0.13522185216424185, "3": 0.0269852677710962, "2": 0.002696997936322585, "1": 0.00214433242246658}, "score": 4.794116610988844}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.396227673443558, "3": 0.26540654407078, "5": 0.2503699887935621, "2": 0.05408582187648978, "1": 0.033787154267106136}, "score": 3.775402753685291}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4381208033054066, "1": 0.3373030818953513, "3": 0.20430234479694973, "4": 0.01852499088199699, "5": 0.0017016542718290152}, "score": 1.9091499261851177}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.36679407204631875, "4": 0.329581305930232, "5": 0.1772492934066732, "2": 0.08147586806033652, "1": 0.04481896962735521}, "score": 3.5130073778690036}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7001245998451694, "4": 0.21280913389433592, "3": 0.06905948806151878, "2": 0.01023295381732186, "1": 0.007654312993603825}, "score": 4.58770650278811}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5991716865390094, "4": 0.2719711729783063, "3": 0.10169393641260893, "2": 0.015292580543478325, "1": 0.011756982024695679}, "score": 4.43167069867188}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3739433363991827, "5": 0.3374696832876897, "3": 0.2214024484114009, "2": 0.041676689969903716, "1": 0.025322440502408013}, "score": 3.956738512687671}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.44109434154869903, "4": 0.37111645527859205, "3": 0.16428162471978416, "2": 0.017393799271172752, "1": 0.006026794509811542}, "score": 4.223964216211008}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6206018413029838, "4": 0.3114677118185802, "3": 0.0572803297235169, "2": 0.006586286464484022, "1": 0.003950119292074277}, "score": 4.538359798419775}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6244198127391638, "4": 0.3094287572332172, "3": 0.05834789478454058, "2": 0.004992452534902096, "1": 0.002698712693102888}, "score": 4.548052459468643}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.42184353662011087, "4": 0.36839914332399903, "3": 0.16161749138240936, "2": 0.03073922969204733, "1": 0.017353770088977476}, "score": 4.146693145064189}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4036211695780556, "5": 0.2432257146254439, "3": 0.23326808673236182, "2": 0.06941908147871334, "1": 0.0502918370668174}, "score": 3.7201952367827706}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.33843385903681455, "3": 0.29028673590137, "2": 0.23212508340467863, "4": 0.10202665258273352, "5": 0.03681407625555331}, "score": 2.2664319619466613}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7931308219661258, "4": 0.1458620451795418, "3": 0.049166430267528295, "2": 0.006168719494264869, "1": 0.005502722550711975}, "score": 4.715239846941962}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3066285189724107, "4": 0.22259820588254833, "2": 0.20653198242542728, "1": 0.17905997023595582, "5": 0.08509553606066157}, "score": 2.828122610360082}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.46568717898690376, "2": 0.28504263882262065, "3": 0.1537619425792324, "4": 0.0751710646998418, "5": 0.020264343807670473}, "score": 1.8992025832279067}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6339954507777951, "2": 0.2542569777463426, "3": 0.079988876318084, "4": 0.02458351457291339, "5": 0.007120260266091558}, "score": 1.5164946812181541}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4355606618357857, "4": 0.3159492119466993, "3": 0.16416197272252914, "1": 0.04232125656006062, "2": 0.04197084787125384}, "score": 4.060495404493255}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4601503937492678, "2": 0.17451518867675128, "3": 0.16547049136031777, "4": 0.10695322389096495, "5": 0.09285222760810215}, "score": 2.1977947942114264}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.789761664140765, "4": 0.1621901283706038, "3": 0.03961100085231102, "2": 0.004396478497409531, "1": 0.004006240534425453}, "score": 4.7293641387123}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.23776547269254758, "3": 0.22986897644767348, "5": 0.22348656021562802, "1": 0.1937877676380966, "2": 0.11501271402393068}, "score": 3.1821646453845673}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2701612165075064, "4": 0.2576686813863978, "2": 0.1943650280502565, "1": 0.19004226199561755, "5": 0.08755791665081906}, "score": 2.8583059301820994}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.38373061347068727, "5": 0.36287393192884776, "3": 0.18648784803694265, "2": 0.037210451606504866, "1": 0.029429994606563207}, "score": 4.013678851305914}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4329777664450278, "4": 0.38330960431342925, "3": 0.1454210574632169, "2": 0.02093342950497381, "1": 0.017168046235096514}, "score": 4.194222632219499}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.47479601941058325, "4": 0.39256405799239813, "3": 0.10356301613559266, "2": 0.015274202267527803, "1": 0.013538853366237065}, "score": 4.300147232737001}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6603334792351192, "4": 0.2615097529491465, "3": 0.06215633098516451, "2": 0.008583598910414504, "1": 0.007181543118518991}, "score": 4.55959699133664}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5155093180174144, "2": 0.30649127210946947, "3": 0.13603788035593437, "4": 0.030764018574919023, "5": 0.011083213640057559}, "score": 1.7152736969602265}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.49735048510732677, "4": 0.26616123692076726, "3": 0.15842155964402316, "2": 0.040707757611141655, "1": 0.03718882745665406}, "score": 4.145971762522896}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4409959884773087, "4": 0.3587871368191232, "3": 0.16825833034065849, "2": 0.021389934886539633, "1": 0.010450522519033278}, "score": 4.198629676380592}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6001349094244486, "4": 0.29010223025524423, "3": 0.09057709612910964, "2": 0.010716683995172938, "1": 0.008386278673368852}, "score": 4.46300394671667}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6759490199892864, "4": 0.26413553960228237, "3": 0.05160858728959295, "2": 0.004798441986037476, "1": 0.003425722091001065}, "score": 4.604516369333947}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"1": 0.38488351458276737, "2": 0.3457445055358438, "3": 0.19222815598823928, "4": 0.05927087146402691, "5": 0.017840115101023388}, "score": 1.9794060533864144}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33219614045735807, "4": 0.25546358601107216, "2": 0.17724360379567358, "5": 0.13940112644795769, "1": 0.0956235835016301}, "score": 3.1657869981050104}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.29332543109198805, "3": 0.26014716210308025, "5": 0.24790719910590225, "2": 0.11205919729972551, "1": 0.08644509555855132}, "score": 3.5042488908168434}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3295334871520778, "3": 0.2789304252842817, "5": 0.22266156634770903, "2": 0.09473111205096758, "1": 0.07408166597749603}, "score": 3.531995022909968}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.42878041681910656, "2": 0.2761885208160688, "3": 0.18963431865052469, "4": 0.08074790996505764, "5": 0.024609535234182103}, "score": 1.9961781772721217}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.40345903120330084, "2": 0.31180527643601286, "4": 0.15209920599701143, "1": 0.0992075657458739, "5": 0.03336177151279405}, "score": 2.708582772688841}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7516200916209664, "4": 0.22076967842124773, "3": 0.026052584569097367, "2": 0.0011058254602991351, "1": 0.0003895957090455503}, "score": 4.7222320093271}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.870116855227233, "4": 0.12074012141787815, "3": 0.00857973458594309, "2": 0.0003342320652887326, "1": 0.00019460027014631457}, "score": 4.8603144990696086}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6173009565578867, "4": 0.33068910658886574, "3": 0.04813919831330936, "2": 0.0027701744013185954, "1": 0.0010479059913679597}, "score": 4.560507206738865}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5824119871382023, "4": 0.34455932405535633, "3": 0.06578588350929362, "2": 0.005139597037303867, "1": 0.002030253737291201}, "score": 4.500292646953623}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"1": 0.957995191820869, "2": 0.0377289528186056, "3": 0.0037071807384996985, "5": 0.0002679679966685135, "4": 0.00021925963114313252}, "score": 1.0468767831487946}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8874666853241957, "2": 0.09937557697368428, "3": 0.011638694492158172, "4": 0.001026511210986396, "5": 0.0004497712669916531}, "score": 1.1275370382360363}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.863059599024454, "2": 0.11690940036586998, "3": 0.0174528957245607, "4": 0.001812948053234897, "5": 0.0006740093329776426}, "score": 1.159964653684703}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.32512885444907874, "2": 0.29208637957434935, "3": 0.25726872957972574, "4": 0.08642575131086735, "5": 0.03886548489442255}, "score": 2.2216376566233142}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6776994353677505, "2": 0.23349745530125499, "3": 0.06768219717780861, "4": 0.015216407386146718, "5": 0.0057945642450776096}, "score": 1.4377374538797847}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4293319427188857, "4": 0.396565323960737, "3": 0.12596086695408698, "2": 0.028960032188033318, "1": 0.018889992396185627}, "score": 4.188836144477098}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4495765676396819, "4": 0.2845081440473441, "3": 0.1866366127515764, "2": 0.047567762765960746, "1": 0.03144271374819241}, "score": 4.073495999668695}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3629150478745096, "3": 0.31481147858502956, "5": 0.19102659878059144, "2": 0.08675010931852974, "1": 0.044251119872293326}, "score": 3.569855878944234}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5920714492974041, "4": 0.32307295964918054, "3": 0.0683560366523244, "2": 0.01000006586009779, "1": 0.006331055570090838}, "score": 4.484803771154092}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3868895760003827, "3": 0.2632647234493122, "5": 0.18876579730954024, "2": 0.09846156598449722, "1": 0.06240288941195608}, "score": 3.5412704413608345}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5431995126073105, "4": 0.2423044949876784, "3": 0.16001181863620864, "2": 0.032008653207595036, "1": 0.022432241551991736}, "score": 4.251884564214313}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9707524019979991, "4": 0.026375078787145956, "3": 0.0026596275095445874, "2": 0.00010158852216687989, "1": 9.394378373190687e-05}, "score": 4.967624563474201}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6652047439993863, "4": 0.16690065897496556, "3": 0.1219655928311335, "2": 0.024375445142708868, "1": 0.02148894633519434}, "score": 4.430049208524892}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9793186991828247, "4": 0.018064427608388802, "3": 0.002227133380598371, "1": 0.0002385239102596103, "2": 0.00013418904079336863}, "score": 4.976124236337303}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.32328868283935136, "4": 0.25129098714453657, "3": 0.22996947413944924, "2": 0.1169269380912214, "1": 0.07846182329041422}, "score": 3.624056518625583}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2764828735728881, "3": 0.26677998139722825, "2": 0.16952231651037283, "1": 0.14357592351064746, "5": 0.143472729524327}, "score": 3.1067719119640795}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9000818458133387, "4": 0.07949479747732249, "3": 0.017730995725185588, "1": 0.0015039684967254954, "2": 0.0011415168851865176}, "score": 4.875596954962188}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.36836853062716396, "4": 0.32585571096353677, "3": 0.2150417034777938, "2": 0.051365270813117904, "1": 0.03931902423531618}, "score": 3.932635860785495}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9358352668022301, "4": 0.05557013846340286, "3": 0.007194916816515849, "1": 0.0008035512430680581, "2": 0.0005372341096917783}, "score": 4.92520971601055}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9643449889865072, "4": 0.03260952680562267, "3": 0.0024506729957588804, "1": 0.00031116911980561674, "2": 0.00018113254533986417}, "score": 4.960697024157369}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5394775541831301, "2": 0.2389633466759858, "3": 0.16276562440710343, "4": 0.03991863585866, "5": 0.018712094490229824}, "score": 1.7592224402161203}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5453800979375615, "2": 0.2045074242003643, "3": 0.1568087451469829, "4": 0.0544015735492985, "5": 0.03872888015588056}, "score": 1.8363900846115095}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30831367158608175, "2": 0.23144759559528838, "1": 0.22009401125945946, "4": 0.16396542443513892, "5": 0.07594734558935616}, "score": 2.6441419556801375}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5238632772424564, "2": 0.19371652497470243, "3": 0.15226488657443804, "4": 0.09225193690700706, "5": 0.03774302079432412}, "score": 1.9261226990446667}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3914331467289704, "2": 0.2422202845818371, "3": 0.20656486493440765, "4": 0.12396533610476691, "5": 0.035692482021724356}, "score": 2.170160916972254}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8151260215713468, "2": 0.14908332517272332, "3": 0.029147585494314017, "4": 0.0048455118220152625, "5": 0.0017308241441595237}, "score": 1.2288536000156576}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.35217681998726375, "2": 0.29894959452100406, "3": 0.23346563176692053, "4": 0.08327204336548494, "5": 0.031927144699789835}, "score": 2.143644320611327}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6505147867027977, "4": 0.15395922259119518, "3": 0.09599541971064225, "1": 0.07100866976708525, "2": 0.028313747921858496}, "score": 4.284925169963393}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.2753995298065616, "3": 0.25299812534136346, "4": 0.19073312105378157, "2": 0.1563610222939943, "5": 0.1243866026768937}, "score": 2.7323136941595485}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6111103075602914, "4": 0.1633806376845619, "1": 0.10646355063195563, "3": 0.09172097416259926, "2": 0.02722470352580503}, "score": 4.145563805565958}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9019821486220507, "2": 0.06230981010595383, "3": 0.02653604716346678, "5": 0.0052396598336435455, "4": 0.003833826072076401}, "score": 1.1478565870703565}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7480943295011271, "2": 0.13136095016683697, "3": 0.07868136003184775, "4": 0.02240058733841361, "5": 0.019254940535169247}, "score": 1.4330351931414465}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4787468921983731, "2": 0.26388483554700065, "3": 0.19735506739599917, "4": 0.04216278580345373, "5": 0.01758082428795129}, "score": 1.85563730023995}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5501982011194536, "2": 0.17217551266067124, "3": 0.14392774156999766, "4": 0.07292651417414708, "5": 0.060649232393717105}, "score": 1.9215206288637363}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6699113558846056, "2": 0.18313763591640786, "3": 0.09388304251227625, "4": 0.03236951481113001, "5": 0.020609956390930183}, "score": 1.550500807223306}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9440577423156953, "2": 0.04789491207191478, "3": 0.007106839135851931, "4": 0.00048023917351760586, "5": 0.00042878325491841864}, "score": 1.0652664957373361}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9603541656532305, "2": 0.03240237034705857, "3": 0.006325033170718076, "5": 0.00046461335169379963, "4": 0.00043126793589603725}, "score": 1.0482057809212109}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9636365579829015, "2": 0.030313012597331004, "3": 0.0051327176691734, "5": 0.0005145751238681025, "4": 0.00037550957040037054}, "score": 1.0437644862262774}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.735993957651203, "2": 0.14800339001109156, "3": 0.07470464550164245, "4": 0.021237569913627123, "5": 0.02000190619939705}, "score": 1.4411588368985448}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9655124329331998, "2": 0.029291731621578297, "3": 0.004260652335606773, "5": 0.0005669984431542455, "4": 0.0003433677938529477}, "score": 1.0411121537220493}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3116749067316126, "1": 0.306724048634043, "3": 0.2291135148982624, "4": 0.11975982501529056, "5": 0.032602050298340464}, "score": 2.259747905662891}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33680006621959, "2": 0.22770132201010104, "4": 0.22309113809599784, "1": 0.12326419503419077, "5": 0.08910229386495584}, "score": 2.9270630244418827}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.399419793955839, "3": 0.2936420413158987, "5": 0.16690262841436113, "2": 0.1003420931068088, "1": 0.03959909557490765}, "score": 3.553737010303712}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.3689709368380499, "4": 0.33418922650838034, "3": 0.18997416305297776, "2": 0.05654393117722114, "1": 0.05022248219753161}, "score": 3.9152330508515196}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31037165887884605, "4": 0.25796217844011443, "2": 0.2189413485225486, "1": 0.1384675329456767, "5": 0.07415422002610676}, "score": 2.910384968246907}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6389836064126337, "4": 0.25288144422071307, "3": 0.07461856068281394, "1": 0.018946366637612025, "2": 0.0144407096787107}, "score": 4.4787064291212575}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5010003596666626, "4": 0.3043563987345081, "3": 0.14485778658724896, "2": 0.02849972046503555, "1": 0.021215133661876367}, "score": 4.23551435868579}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30641658928692794, "4": 0.30391026562952916, "5": 0.2742454968044709, "2": 0.07434739081253218, "1": 0.04100852118876416}, "score": 3.6960867607216334}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9713265494631268, "4": 0.025031366012941248, "3": 0.003205676930970999, "1": 0.0002364085749585193, "2": 0.00015635585917913032}, "score": 4.967141144183484}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6712760269875918, "4": 0.2618631080825824, "3": 0.057281836215998916, "2": 0.005489857390651488, "1": 0.004018028176682983}, "score": 4.591002437233212}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5263044138978799, "2": 0.2568552197764249, "3": 0.16529913617010483, "4": 0.034614763402165696, "5": 0.01681858086290707}, "score": 1.7586539538321635}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4069326281673317, "4": 0.37326143751181545, "3": 0.17201188598368253, "2": 0.0329891024777461, "1": 0.01460856906761607}, "score": 4.125141404892925}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3943764377702972, "3": 0.26644562232623586, "5": 0.24092622805682992, "2": 0.06715670566606056, "1": 0.031017770400802128}, "score": 3.747094349830966}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4884748661000144, "4": 0.37208656506210425, "3": 0.11357482592789568, "2": 0.01699913191590523, "1": 0.008780833009836031}, "score": 4.314585632660977}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5105812481379701, "4": 0.2965870534785099, "3": 0.1467327755361206, "2": 0.02957875239218189, "1": 0.016355451698493197}, "score": 4.25566672582722}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5223687097099415, "2": 0.21308615744752107, "3": 0.12433877278778138, "4": 0.08298656099651004, "5": 0.05710184220819865}, "score": 1.939241544819469}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8983385385676694, "4": 0.08773825252123672, "3": 0.012228316403025435, "1": 0.0008397318023711811, "2": 0.0007994778746955195}, "score": 4.882041185558411}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29240761744276556, "5": 0.22134690550524339, "4": 0.18334000484906945, "1": 0.15239101411011552, "2": 0.15041034298257247}, "score": 3.170859233684702}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8871730090770484, "4": 0.09250895762159381, "3": 0.016512807286179265, "1": 0.00205921795861358, "2": 0.0016811397381858181}, "score": 4.8611761314861335}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5245255968255365, "4": 0.27907226956625747, "3": 0.12576445830890773, "1": 0.03825611737977061, "2": 0.03230182011601905}, "score": 4.219406641148918}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"5": 0.76015968950779, "4": 0.1036659052866243, "3": 0.08860117142122348, "1": 0.03012278550743376, "2": 0.01735788168411077}, "score": 4.546524988152087}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.46339637019453744, "4": 0.27361072347889426, "3": 0.1716515378327023, "1": 0.046399490519193745, "2": 0.04487039750483252}, "score": 4.0628100554868665}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2891937789982361, "1": 0.2804331238759261, "2": 0.2679542826901355, "4": 0.09679649442239997, "5": 0.06555439650546514}, "score": 2.3990439379475514}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3557304136600285, "5": 0.26393722188602886, "4": 0.18681570179528909, "2": 0.11645582062526452, "1": 0.07699154256339395}, "score": 3.4442820283243862}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3807416187212622, "2": 0.282052459147175, "3": 0.2237295550679543, "4": 0.08416272093617244, "5": 0.02926883736829811}, "score": 2.099124331962247}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.40115339245263326, "2": 0.2367042044121427, "3": 0.1928584266352323, "4": 0.12491316038842983, "5": 0.04418285769856393}, "score": 2.1741126539932782}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.2795287023188053, "3": 0.2436084392166415, "2": 0.2218973037191536, "4": 0.16016505527636316, "5": 0.09475032546866621}, "score": 2.568689357276584}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6704047329161892, "4": 0.1502216813804496, "3": 0.12337892107137303, "2": 0.02796431628392382, "1": 0.02796276710371438}, "score": 4.407236399508448}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.34461121859712, "4": 0.20335806230180803, "3": 0.19084055311890616, "1": 0.163936601847103, "2": 0.09716758604838369}, "score": 3.4675799113796084}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3185624970953078, "3": 0.2841135206753815, "5": 0.1893304647523065, "2": 0.11593445391905437, "1": 0.09197165934391978}, "score": 3.3973803867133983}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"1": 0.35590173909749484, "2": 0.25847425081372283, "3": 0.2580575130770376, "4": 0.07584930773443825, "5": 0.05154204998025053}, "score": 2.208517058920294}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.25861712315671515, "3": 0.25061775226070115, "5": 0.23769322674372426, "1": 0.13984596669104538, "2": 0.11314945766232787}, "score": 3.341188277456529}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.36639430112546384, "3": 0.27548750646550635, "5": 0.2589056938495706, "2": 0.06470142842841874, "1": 0.03425325781881126}, "score": 3.7511914111531994}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4636003094607714, "4": 0.31961111111590795, "3": 0.1688287991997194, "2": 0.030898148993366466, "1": 0.016931437127424856}, "score": 4.182204622859446}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6004603667839511, "4": 0.23376365392638299, "3": 0.12536665440254222, "2": 0.02209773863283561, "1": 0.01819466244799942}, "score": 4.376358253011209}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.25019769340415376, "3": 0.22775850499108058, "5": 0.20182017516888817, "1": 0.1818458916092204, "2": 0.1382020685445126}, "score": 3.1519708881398913}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8995788676519321, "4": 0.0786815803399643, "3": 0.01595488064511098, "1": 0.003694832711117453, "2": 0.002025053012001742}, "score": 4.868545652135297}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9091090600033117, "4": 0.07611419504786045, "3": 0.01305186426318269, "1": 0.0008534235432500787, "2": 0.0007966655526938844}, "score": 4.891970305882133}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.915190403589476, "4": 0.07483010512798283, "3": 0.00868537502022206, "1": 0.0006261520030283968, "2": 0.0005356915655113416}, "score": 4.903674720918782}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8768200200174123, "4": 0.10575293577239543, "3": 0.014485422211468757, "1": 0.001642013576033143, "2": 0.0012021868568510897}, "score": 4.855087487326087}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7574199225438542, "2": 0.1924548496572245, "3": 0.03930557156710566, "4": 0.008063886037560074, "5": 0.002721625409854413}, "score": 1.3061546061265532}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5105799972154446, "2": 0.19213623524582807, "3": 0.13751224655322516, "4": 0.10235800069233018, "5": 0.05725851007479926}, "score": 2.0034243117501513}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.295706195607885, "1": 0.20923404939939455, "4": 0.18584971792430915, "2": 0.16867897950659222, "5": 0.14034213727630734}, "score": 2.8793641236073313}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5866753374399974, "2": 0.23633896785141517, "3": 0.11006936731360668, "4": 0.0482708171846981, "5": 0.018565385995482856}, "score": 1.675605830401329}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7677822228835774, "2": 0.16936083869913682, "3": 0.046659547978253404, "4": 0.011862359015572053, "5": 0.004283604289760056}, "score": 1.315417649887052}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6839439152294261, "2": 0.17057148555677726, "3": 0.08352564237147157, "4": 0.03327753946857267, "5": 0.02818668995135084}, "score": 1.5504744833330788}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3462194349117941, "5": 0.33466421269838587, "3": 0.19380629463425914, "2": 0.07277390760817777, "1": 0.05231030975979312}, "score": 3.8383426648131564}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.2826447415889799, "3": 0.27940246771619925, "4": 0.27366405540592775, "2": 0.10349975845992167, "1": 0.06060322315166857}, "score": 3.6143614537198503}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5112753441215149, "4": 0.34489077716598326, "3": 0.10909127083744517, "2": 0.020658091420067873, "1": 0.01389426102502075}, "score": 4.319245845624496}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3926414439203886, "5": 0.3125959552931295, "3": 0.2114274849589842, "2": 0.04842631571006722, "1": 0.03476274540402535}, "score": 3.9000129991291783}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.365752794004878, "2": 0.2452589715407079, "3": 0.24165654413760027, "4": 0.08648009561676727, "5": 0.06046791410500553}, "score": 2.2303560668340676}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9060229338131368, "4": 0.08219523064119202, "3": 0.01038410819167149, "2": 0.0007620901516680214, "1": 0.0005539899567452492}, "score": 4.892525547700479}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3734468563780017, "3": 0.3332400426132105, "5": 0.1688337121892598, "2": 0.09127877443076438, "1": 0.032877192457023356}, "score": 3.554260381374942}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8005431133255237, "4": 0.1730919366358855, "3": 0.022892141345608824, "2": 0.0021388985044663734, "1": 0.0012069219541215315}, "score": 4.7698501710225845}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.739777103236417, "4": 0.20559957757490568, "3": 0.04411598899474622, "2": 0.006190029045316206, "1": 0.004220073643584968}, "score": 4.670686044351034}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3780466039837326, "3": 0.30852382811409823, "2": 0.12676894249306436, "5": 0.11874228578357776, "1": 0.06775223031402255}, "score": 3.353316461583956}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8111993479132632, "4": 0.158905038074198, "3": 0.027503747798872866, "2": 0.0011886500827538065, "1": 0.0011673722456220855}, "score": 4.777844064165427}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6762843332870256, "4": 0.23154345789154296, "3": 0.07916641683095868, "2": 0.0074085762287859425, "1": 0.005459418482139775}, "score": 4.566000501881457}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8949661076247613, "4": 0.09421202986313779, "3": 0.009937680854224942, "2": 0.00043391560556353703, "1": 0.00040223281306610276}, "score": 4.882996310293238}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9478645942484358, "4": 0.047991181677692285, "3": 0.0037661802026930694, "1": 0.000168417086083408, "2": 0.00014454134019691142}, "score": 4.943365479469032}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5637990417111524, "2": 0.2759054346652048, "3": 0.1131096247512805, "4": 0.033650488698844266, "5": 0.013471788780663553}, "score": 1.6570051049668435}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.3749678462579603, "2": 0.3582891632625825, "3": 0.22161006621117885, "4": 0.03714355532451897, "5": 0.007905635653330712}, "score": 1.9446416022214499}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.4707753983278071, "2": 0.29357498113222663, "3": 0.15761905523747802, "4": 0.05957902478448864, "5": 0.018378593286397644}, "score": 1.8611273559629133}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.3607700875983794, "4": 0.3290680864275743, "3": 0.2122075868802637, "2": 0.05686455880583643, "1": 0.040994814331359625}, "score": 3.9118405767843485}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.30905964339954206, "3": 0.2868963437682108, "1": 0.26391188512891156, "4": 0.10196371135793704, "5": 0.03784719160007921}, "score": 2.3405628533712504}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3368876456216361, "4": 0.2535208020370067, "2": 0.20543783436165686, "1": 0.12482270606155721, "5": 0.07918777881182129}, "score": 2.9568069264977885}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4032945865818971, "3": 0.3230041847374204, "5": 0.1896537950951484, "2": 0.05775614663534462, "1": 0.026222551347075265}, "score": 3.672447148503013}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.35870763839835446, "4": 0.29033963096324505, "5": 0.19394280169798336, "2": 0.10312510666505716, "1": 0.05381171955189672}, "score": 3.467510864907835}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8371501197790829, "4": 0.1457220265190745, "3": 0.01529018132581461, "2": 0.001027285903221134, "1": 0.0007205231590612376}, "score": 4.817717279954127}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4634402373711408, "5": 0.4006528088700619, "3": 0.110586196863669, "2": 0.0172342223573385, "1": 0.00797672781387372}, "score": 4.2316934253460845}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4673157806490101, "4": 0.32523437588227405, "3": 0.13384812731986193, "2": 0.039545890366123625, "1": 0.03384236361176222}, "score": 4.152881416160608}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.336717728669575, "2": 0.2133656112515487, "1": 0.1867337077012214, "4": 0.17986971423037187, "5": 0.08291601922365167}, "score": 2.7587729060570765}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7388225711702104, "4": 0.19355712315013593, "3": 0.05524695794053201, "2": 0.0064842378057656065, "1": 0.005782489382522563}, "score": 4.6533293278033865}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5186283712441392, "4": 0.3148611282699772, "3": 0.12009828857472753, "2": 0.02559450497375011, "1": 0.02061410559275483}, "score": 4.285556895711588}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6185317219154806, "4": 0.28582661307340335, "3": 0.07317080327097632, "2": 0.012753409899961583, "1": 0.009521158941840448}, "score": 4.491387077812769}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3519311567241575, "1": 0.3150926047587606, "3": 0.2546670177207642, "4": 0.061388571074918546, "5": 0.016661468514493846}, "score": 2.1123650835732963}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5080658722635096, "4": 0.3587100058765805, "3": 0.1068463561797669, "2": 0.015316210525489204, "1": 0.01088427382378184}, "score": 4.337994193621891}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3639847892475449, "3": 0.2819321894226906, "5": 0.2327188747538572, "2": 0.07394108141542988, "1": 0.047086040590945406}, "score": 3.6615323288062855}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.687004992282113, "4": 0.251056340724754, "3": 0.051606713931876005, "2": 0.005529264356801655, "1": 0.004649460907382324}, "score": 4.610484910172419}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.45565902562281624, "5": 0.309157569005168, "3": 0.18930422536832311, "2": 0.03097505734924128, "1": 0.014733853113382987}, "score": 4.01370400297251}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2834778186411551, "5": 0.28245989586866, "3": 0.23876188995563993, "1": 0.0976825640535239, "2": 0.09752283726953878}, "score": 3.555562420215926}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.323328094131859, "5": 0.30752835026549613, "4": 0.20100419509931297, "1": 0.08842248380432642, "2": 0.07951124665252907}, "score": 3.559819797140028}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3237634896382936, "2": 0.3048620194445824, "1": 0.2389108760865373, "4": 0.10117202430693996, "5": 0.03118427243137881}, "score": 2.380790345153169}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5008157850622461, "4": 0.3046490562833893, "3": 0.13810458756028327, "2": 0.03012926561550705, "1": 0.026141834328705024}, "score": 4.224062894852319}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.32843346612612256, "3": 0.2672132366996621, "5": 0.23196587700695473, "2": 0.10015126358753276, "1": 0.0721623959846928}, "score": 3.547929580194986}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"3": 0.33420125753709196, "2": 0.2546482749180036, "4": 0.19387516624505985, "1": 0.17573621265303455, "5": 0.04140109289787112}, "score": 2.6705111837607656}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.42595462179269017, "4": 0.3217881722729651, "3": 0.16825405663334414, "2": 0.05002674582854303, "1": 0.03385424098091613}, "score": 4.056091202800599}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7687441112910127, "4": 0.19309412783094285, "3": 0.03537682974910742, "2": 0.0019047014535147626, "1": 0.0008249168207878966}, "score": 4.72712334744053}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8647249236209065, "4": 0.1090294772311705, "3": 0.022525438689633075, "2": 0.002060275638571417, "1": 0.0015960922194716062}, "score": 4.833343818164776}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2693745738825231, "2": 0.24362437172955376, "4": 0.21698963316848138, "1": 0.20354063773626235, "5": 0.06642393636732688}, "score": 2.699117763236053}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3703283997894608, "2": 0.30408339181880845, "3": 0.22012073229436033, "4": 0.07664039433830344, "5": 0.02847746802520207}, "score": 2.0885364788260583}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33872557930480546, "4": 0.3016730089583498, "5": 0.14799547204153357, "2": 0.14604936470555366, "1": 0.06536642706218657}, "score": 3.320942760812328}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3849231557772225, "4": 0.23164420120580803, "2": 0.21897274696314112, "1": 0.09074451032077223, "5": 0.07363657012141302}, "score": 2.9784538756729817}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3406015363661239, "2": 0.2556389452826781, "4": 0.17887640258324916, "1": 0.1737102495985726, "5": 0.05105644467142413}, "score": 2.6778923471908316}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.38046755678759964, "1": 0.3106672112548303, "3": 0.2199806920258681, "4": 0.07228889917408805, "5": 0.016536768224226155}, "score": 2.1035076775510944}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3713853040163571, "2": 0.3050576816779905, "3": 0.21969964839054984, "4": 0.075763570660845, "5": 0.027761872290352534}, "score": 2.083154703522596}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.37504261105014947, "2": 0.23807441169407706, "4": 0.21526617356149053, "1": 0.09936785579132526, "5": 0.07215217851283544}, "score": 2.92275293215879}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3905021905949301, "3": 0.28305654376691525, "1": 0.2456162795728883, "4": 0.06697060414312515, "5": 0.013763790665561463}, "score": 2.2126921125226997}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.38263855730072677, "4": 0.27108046048784323, "2": 0.18602273156895252, "5": 0.08847617254487994, "1": 0.07154545478606938}, "score": 3.1189473101429352}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3704514988879904, "2": 0.3028148549507956, "4": 0.15367144956286888, "1": 0.14021090859866983, "5": 0.032751756000578926}, "score": 2.6359020500190633}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3812997758408953, "3": 0.22373512600323334, "5": 0.1636553314822633, "2": 0.14667451951845303, "4": 0.0844942157182911}, "score": 2.5024606387915664}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2821375672120057, "5": 0.21005552047362747, "4": 0.20679101191206706, "1": 0.17169821623147974, "2": 0.12921414657668917}, "score": 3.1543074504418485}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6002739767932948, "4": 0.24615233173533083, "3": 0.11905351274698843, "1": 0.01754512404265787, "2": 0.01693049237959185}, "score": 4.394741697757952}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6606363908307147, "4": 0.2439713203857246, "3": 0.06748542029929869, "1": 0.015976082801723697, "2": 0.011816953988535153}, "score": 4.5216481942468}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3468675056667086, "4": 0.2354250441624406, "3": 0.19052541142583657, "1": 0.14573358273397533, "2": 0.08138136202032896}, "score": 3.5563488556725322}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6539024353994428, "2": 0.12811429292449392, "3": 0.1227744434691635, "4": 0.048777931098436325, "5": 0.04614644280433526}, "score": 1.7047832229967297}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8622156375779068, "2": 0.07392606550671152, "3": 0.038182346641047915, "5": 0.012930690301971073, "4": 0.012647086582724489}, "score": 1.2399783392318673}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7102170013071226, "2": 0.14883748097928962, "3": 0.09830016237492639, "4": 0.028732749764702054, "5": 0.013792071236702525}, "score": 1.4868630236819529}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6968151300919331, "2": 0.09481136433067204, "3": 0.09001694937447531, "5": 0.06761016076862755, "4": 0.05059992423610581}, "score": 1.6971877967944076}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8925892592186704, "2": 0.055709310033104434, "3": 0.029057809564168053, "5": 0.012702992288529495, "4": 0.00990527931336536}, "score": 1.1943596067865436}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5662318815270732, "2": 0.27468227854313393, "3": 0.11221109554584277, "4": 0.0334177026482993, "5": 0.013394273689018566}, "score": 1.6529756583423645}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.37023453343817686, "3": 0.2871868872666312, "1": 0.26937010230171093, "4": 0.05854197269767251, "5": 0.014570499158902331}, "score": 2.1786293771747833}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7086198882369682, "2": 0.25989730675724115, "3": 0.027749679178268538, "4": 0.0032578930377136998, "5": 0.0004453757277603907}, "score": 1.3269616092510155}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2903564711502016, "4": 0.2538366319988987, "2": 0.1611321730777472, "5": 0.15700914922708792, "1": 0.13747682796062366}, "score": 3.131793977117243}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.5303702136310083, "2": 0.2586361322138414, "3": 0.15776613511033427, "4": 0.03646559739443113, "5": 0.01664927844718738}, "score": 1.75024681861139}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5238683325474736, "2": 0.2583260324965333, "3": 0.16588141721907837, "4": 0.0322458411708024, "5": 0.019427222011577126}, "score": 1.7647273432486403}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.47589625508866357, "2": 0.21003004228427744, "3": 0.17676151991621078, "4": 0.08019391819220797, "5": 0.056663648147730554}, "score": 2.031258256170136}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30726208454482806, "1": 0.2468665924019598, "2": 0.18898699042912054, "5": 0.14071106154584961, "4": 0.11607760534145273}, "score": 2.714752264765353}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.3732896720747666, "2": 0.23821965756599556, "3": 0.22422032876431594, "4": 0.09667517802609138, "5": 0.06745231332701779}, "score": 2.246673190047633}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.553587585481316, "2": 0.17181887660537648, "3": 0.11710193314707482, "5": 0.08891686028010795, "4": 0.06845715526405717}, "score": 1.967175379212574}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7951764971296786, "2": 0.171555199704006, "3": 0.02961047781653557, "4": 0.002761647105220514, "5": 0.0008162975702923504}, "score": 1.24234564566749}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29650224170987605, "1": 0.22851557706696782, "2": 0.19682036874483905, "4": 0.18268958924641487, "5": 0.09534161404411054}, "score": 2.7194846565746937}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.48657511038125345, "2": 0.3032806999025238, "3": 0.17450326969640242, "4": 0.028484699372314338, "5": 0.007083561932337417}, "score": 1.7661312512539882}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5471687079898631, "2": 0.25247738465518776, "3": 0.14671754546447435, "4": 0.03985145350528186, "5": 0.013690939709493876}, "score": 1.7202982804134763}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.315915817879904, "2": 0.21622297761153086, "4": 0.17764928167635996, "1": 0.1736181381123111, "5": 0.11650436952818967}, "score": 2.8471851029232687}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3656467045083627, "2": 0.29843270961134355, "3": 0.21839926510956334, "4": 0.08663940013179043, "5": 0.030814140106108695}, "score": 2.118481811943452}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5144378643501151, "2": 0.30650656640553725, "3": 0.13935192653461714, "4": 0.03017625265055583, "5": 0.009508862695071023}, "score": 1.713787852814165}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.40676750400177725, "4": 0.25715792208067184, "3": 0.18494536904012274, "1": 0.0854747729322692, "2": 0.06557154777887972}, "score": 3.8342409818090615}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.3045908434111506, "2": 0.27694354561782414, "3": 0.254798740089511, "4": 0.12552705072637957, "5": 0.038066098351881045}, "score": 2.315483551203054}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3670041951743943, "2": 0.3484036700662504, "3": 0.19387146326474813, "4": 0.06860121726637013, "5": 0.022091956411272082}, "score": 2.030346406316837}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.25807929405028546, "4": 0.23892528284672473, "5": 0.23424774134043874, "1": 0.14177146773151025, "2": 0.1268257223375711}, "score": 3.297096818330326}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.96141399858803, "4": 0.03417644550908701, "3": 0.004050247048882592, "1": 0.0001780676542193966, "2": 0.00016321780861045182}, "score": 4.956520352699748}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6712201120234343, "4": 0.2233171992587105, "3": 0.08905251741198034, "2": 0.009725511446118149, "1": 0.006642412853165722}, "score": 4.5428122653530725}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8142355022659706, "4": 0.14627089957542713, "3": 0.03382249044469725, "2": 0.002953003178080407, "1": 0.002670351946735781}, "score": 4.7665325535389576}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8157108233304943, "4": 0.1463739105443348, "3": 0.03306112692184725, "2": 0.002450047173796629, "1": 0.002375604375437724}, "score": 4.770644742795599}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6686247754294423, "2": 0.17106030907653375, "3": 0.08915275786875353, "4": 0.038220723900153165, "5": 0.032390147238761}, "score": 1.5939160033362143}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3977505416420956, "4": 0.3382754752200237, "3": 0.20030539541563197, "2": 0.042567756583593686, "1": 0.020851191209900286}, "score": 4.049768483630283}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28844890916470894, "5": 0.2669457032169752, "4": 0.26546868301582677, "2": 0.1081283317858985, "1": 0.07078458698033381}, "score": 3.549785617937483}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4030085505559964, "3": 0.24423431673700233, "5": 0.20770044616086383, "2": 0.09309957124747492, "1": 0.05180753898788513}, "score": 3.6217877983794464}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.316433648742369, "3": 0.27320774568099865, "5": 0.22448522205546947, "2": 0.1059602664450483, "1": 0.07973563332025399}, "score": 3.5000613125276594}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6117919409740111, "4": 0.31310511943029806, "3": 0.05965387322638313, "2": 0.008172272148694223, "1": 0.00722806220625826}, "score": 4.514134391636018}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4725944111738273, "4": 0.3653947510806698, "3": 0.11573143357052537, "2": 0.02398167696523269, "1": 0.02220503531126445}, "score": 4.242306977632815}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.34873620576179987, "4": 0.26607275302075467, "5": 0.17176819751231165, "2": 0.11383887585837982, "1": 0.09951080975149727}, "score": 3.2967703638385513}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8608602663514165, "4": 0.1262218128889223, "3": 0.011341841546451637, "1": 0.0007652870237967809, "2": 0.0007271411101660764}, "score": 4.845839036861546}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.628240094182932, "4": 0.29422955999864786, "3": 0.05925182486689047, "1": 0.009725669973246708, "2": 0.008484465294659778}, "score": 4.522878086182357}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6444725362507318, "2": 0.246999145962954, "3": 0.0834211170190752, "4": 0.017974377633140776, "5": 0.006950205857916463}, "score": 1.4956558516537453}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6934410267317, "4": 0.2176750553476759, "3": 0.06793567346377105, "2": 0.010863895794812976, "1": 0.010010122980162071}, "score": 4.573789782675692}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4847893801975832, "4": 0.321333870937207, "3": 0.1542011900975109, "2": 0.024552318236854203, "1": 0.01494718935246281}, "score": 4.236683654005167}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8053351361509604, "4": 0.1372755993188645, "3": 0.04009443629725715, "1": 0.011209507240507819, "2": 0.0059779020519921304}, "score": 4.719733687058243}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5097064383856047, "4": 0.21025430599123246, "3": 0.14945820357333586, "1": 0.07614789826166408, "2": 0.054323590438800785}, "score": 4.02315989662552}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3989788384360047, "2": 0.28615616091217083, "3": 0.22672895630607542, "4": 0.06300661236019416, "5": 0.02506296551307662}, "score": 2.0289541636108077}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6566318484427366, "4": 0.24496510675217434, "3": 0.07425948985286995, "2": 0.01246601671187443, "1": 0.01151636743803185}, "score": 4.522975511234757}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6175164939416825, "4": 0.22528599388222315, "3": 0.12249405264655217, "2": 0.019235277808838658, "1": 0.015414762882806335}, "score": 4.410329516354952}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8886783499655683, "4": 0.09321368810455752, "3": 0.015503966260754804, "2": 0.0014308737604702025, "1": 0.0010985757619168337}, "score": 4.8670815464863155}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8308085298509212, "4": 0.12878047093285006, "3": 0.03138313287440957, "1": 0.005154047245656167, "2": 0.0037511695785999487}, "score": 4.776556160320768}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31856905955034104, "4": 0.24627112889290265, "5": 0.19770859001547197, "2": 0.13311683203585375, "1": 0.10422127456639498}, "score": 3.300162880661149}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4009211517748425, "4": 0.33421121688296, "3": 0.18348051544249486, "2": 0.042788008109963534, "1": 0.038564797518708026}, "score": 4.016170782380223}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5019391709695117, "4": 0.35341707638127196, "3": 0.12134147507479118, "2": 0.015046583853966258, "1": 0.008161763648214098}, "score": 4.326049863129344}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7223390369821165, "4": 0.2161025965585144, "3": 0.05172434078720691, "2": 0.005666650933721349, "1": 0.004135605617189694}, "score": 4.646895128765681}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.28829638887419806, "1": 0.2840466482238108, "3": 0.24996986709610242, "4": 0.12974598519957944, "5": 0.04787585368977979}, "score": 2.369066834504403}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6984591740673004, "4": 0.22833103388850998, "3": 0.060927515003671245, "2": 0.006940785683446758, "1": 0.005280916060531119}, "score": 4.607844159855376}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.45281937667436584, "4": 0.3158916512442218, "3": 0.17723160480986686, "2": 0.035088459210419046, "1": 0.01887324817641306}, "score": 4.148805343616437}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.35246547668795, "4": 0.3135801781291171, "5": 0.24060644225748573, "2": 0.06130612025475616, "1": 0.032001500072995716}, "score": 3.669510911882057}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6612246916759473, "4": 0.25034532856420216, "3": 0.07334795168533764, "2": 0.009017422857299956, "1": 0.006033837918348855}, "score": 4.551757356604453}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7390709607337788, "4": 0.21066090996336964, "3": 0.04203474251097728, "2": 0.004759796327474256, "1": 0.003429581626586283}, "score": 4.677257686011758}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3958981689152882, "5": 0.3829820950925033, "3": 0.14209622642532355, "1": 0.04096197834413114, "2": 0.0379479270431999}, "score": 4.0421088632912525}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9323912148012548, "4": 0.059825714625122296, "3": 0.006872880320411669, "1": 0.0004227726474025631, "2": 0.00038361159063183897}, "score": 4.923578666378431}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7571172877225266, "4": 0.19712234547327584, "3": 0.03858678571933553, "2": 0.0039309407702704515, "1": 0.003158274325737779}, "score": 4.701252959384791}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8483790925354214, "4": 0.12960085472310806, "3": 0.018857774684805137, "2": 0.0017910314428992832, "1": 0.0012788602850485886}, "score": 4.822178632175048}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3625389000362261, "4": 0.35651545073386415, "3": 0.18358529437506144, "2": 0.054246489409557494, "1": 0.04301567907924339}, "score": 3.941407836652722}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.33619827126660706, "2": 0.31895217789186203, "3": 0.22801136608961234, "4": 0.09105893907299553, "5": 0.025699053925394733}, "score": 2.1510402469274346}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.43103960592623, "2": 0.3189429922014133, "3": 0.16714979375642156, "4": 0.05917861709851402, "5": 0.023570628432521275}, "score": 1.9251704503058547}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2706917119322425, "2": 0.26646400770846473, "1": 0.23343897151410214, "4": 0.15080867477946788, "5": 0.07844667377506964}, "score": 2.5742962329322965}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.3479951277583743, "2": 0.253525314747446, "3": 0.21294192564550032, "4": 0.1277629097767656, "5": 0.057504159193200725}, "score": 2.2930643873645535}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6208248573998731, "2": 0.25352997965615437, "3": 0.0913834033147341, "4": 0.02527370630887051, "5": 0.00887867451010087}, "score": 1.5476925092076872}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"3": 0.42299360003128444, "2": 0.20696731432420643, "4": 0.16233405483641972, "1": 0.11371067445529767, "5": 0.09396123268731223}, "score": 2.91586507011897}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5779145665335709, "2": 0.24897360304613392, "3": 0.13418288447798693, "4": 0.023928886731986638, "5": 0.014968773716071424}, "score": 1.6490214320186332}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.49282472280084744, "2": 0.2825437141535919, "1": 0.13516473299897577, "4": 0.07436766067392424, "5": 0.01507661215195829}, "score": 2.5516375910164832}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9718738042198648, "4": 0.024795165111472322, "3": 0.0029859650038823846, "1": 0.0001765672913750998, "2": 0.00014468971571557877}, "score": 4.968091806876869}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.23081882120293376, "5": 0.22828379708441435, "1": 0.21889447819747726, "4": 0.20814914769850587, "2": 0.11372200060250617}, "score": 3.113220702287751}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3238118635170843, "4": 0.3197056340959988, "5": 0.1993623411745912, "2": 0.09753223892420403, "1": 0.05950937594126529}, "score": 3.5019187495226403}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3250484275197094, "4": 0.23915373288700498, "5": 0.17299482469320532, "2": 0.15441927671408248, "1": 0.10831686632803349}, "score": 3.2141046904817165}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3803040175286458, "5": 0.321687983036393, "3": 0.223815394188169, "2": 0.0491127600070546, "1": 0.02496882830251201}, "score": 3.9247322279290517}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.46283947096214867, "4": 0.2115988105993181, "3": 0.16949017812597755, "1": 0.08057730861000936, "2": 0.07540242067806077}, "score": 3.900803418310231}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.34364765680108944, "5": 0.3355923498801721, "3": 0.20488344961221755, "2": 0.06106649662128732, "1": 0.054679653719567387}, "score": 3.8445166718722175}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"5": 0.34684731856532913, "4": 0.3177845632016371, "3": 0.17910893192457616, "1": 0.0887037423023704, "2": 0.06721608499839007}, "score": 3.7671159584396086}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7535850982499159, "4": 0.20933368944774497, "3": 0.032906173316940165, "2": 0.0021287230203665976, "1": 0.0019470906400065168}, "score": 4.710650721521047}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.34728271156963064, "3": 0.3171993939016211, "5": 0.22556130375030206, "2": 0.07549594747466566, "1": 0.03435292881663243}, "score": 3.6542739887494564}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7982014657898872, "4": 0.17830029492859936, "3": 0.021170402103313373, "2": 0.0011289712038839385, "1": 0.001122827299503338}, "score": 4.771463300427328}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9346803273832048, "4": 0.057173990245432106, "3": 0.006981370742787472, "1": 0.0006867130764977629, "2": 0.00044311155609182726}, "score": 4.924784487337644}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.41376646438792086, "2": 0.22290223761301217, "4": 0.20680974802647947, "1": 0.0925376398439713, "5": 0.06384916973215235}, "score": 2.926520669555713}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4370460988897233, "5": 0.2671043694889077, "3": 0.23211519508674824, "2": 0.049007820086655544, "1": 0.014511983827971994}, "score": 3.8934147167248585}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.47382562723562793, "5": 0.2944666573873804, "3": 0.19016404207064538, "2": 0.03111491477491686, "1": 0.010379460266949659}, "score": 4.010934944039815}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4452121361307608, "5": 0.329557412151712, "3": 0.18571740287818422, "2": 0.029838165005237182, "1": 0.009608347760209815}, "score": 4.055342318243}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.34635008815076995, "3": 0.31133374722680557, "5": 0.1605631750241575, "2": 0.12987138037740203, "1": 0.051748713864779416}, "score": 3.434165328648075}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3036047767162341, "3": 0.2897304415970047, "5": 0.21480975565295882, "2": 0.10675799874339244, "1": 0.08492224549681794}, "score": 3.4567016214136506}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7552272587946576, "4": 0.20036737949341596, "3": 0.03670649735299967, "2": 0.004141142761028655, "1": 0.003492370314822626}, "score": 4.699807098266911}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5849236810526222, "4": 0.29067042900514434, "3": 0.09929274222279551, "2": 0.01360111369846344, "1": 0.01140706931982387}, "score": 4.424252034961491}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9065545174499154, "4": 0.0822404997966379, "3": 0.009789626248819336, "1": 0.0007044585953744492, "2": 0.0006804082311497106}, "score": 4.893317935928984}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8350901382144782, "4": 0.14082150676673283, "3": 0.020446531902397595, "2": 0.001920695344331539, "1": 0.0016414701594798784}, "score": 4.805942004560938}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"2": 0.37361392531313004, "1": 0.24601381157795288, "3": 0.23971384008831156, "4": 0.1178902231280325, "5": 0.022614314234321073}, "score": 2.2973691783211363}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4425440683505893, "5": 0.3297929650639513, "3": 0.16190668957073473, "2": 0.040005377356145136, "1": 0.02568355693043051}, "score": 4.01082557901366}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4012313040064146, "4": 0.3656305798442453, "3": 0.18494618280153682, "2": 0.0331019660858197, "1": 0.014988280249003881}, "score": 4.105127038340739}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6985031993364836, "4": 0.24332341368909635, "3": 0.046654830936403276, "2": 0.006810225815312942, "1": 0.004579999454320711}, "score": 4.624568069706784}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4872902682935289, "4": 0.37548513341492185, "3": 0.10176470949973504, "2": 0.021410444826928412, "1": 0.01390302828977992}, "score": 4.301039661195824}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4216124296911251, "4": 0.2677908268622829, "3": 0.1871886026634817, "1": 0.06484023874875422, "2": 0.05845472242845673}, "score": 3.9229849493913913}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5025127330333962, "4": 0.31114246029425563, "3": 0.14405965418739883, "2": 0.025119722108576437, "1": 0.01712355975959632}, "score": 4.256853709973313}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5399196752635863, "4": 0.335252701059903, "3": 0.09984976226944624, "2": 0.013893571886764685, "1": 0.010967159189398312}, "score": 4.379425733914182}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6889853781754346, "4": 0.2552523028598998, "3": 0.0449036273586181, "2": 0.006431089596219058, "1": 0.004355769460059001}, "score": 4.618196669887259}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2879025569560522, "4": 0.2858768372213826, "5": 0.23046727513697202, "2": 0.12329626022121593, "1": 0.07235726617905121}, "score": 3.478848386036956}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9037893279970884, "2": 0.06577379317504038, "3": 0.021175733481755363, "5": 0.005252450234085746, "4": 0.003908996451299298}, "score": 1.140876095586851}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5901631233746433, "4": 0.2844207565688967, "3": 0.10334472854594014, "2": 0.012073878036407816, "1": 0.00980856495499395}, "score": 4.433326820351906}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3503314404080252, "4": 0.21418314761442364, "2": 0.17426356229052228, "1": 0.15936697775360234, "5": 0.10164451500296551}, "score": 2.9244587692011934}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5255182659959754, "4": 0.33968080878827916, "3": 0.10825710274278535, "2": 0.014763410836831284, "1": 0.011718939327444826}, "score": 4.3525991986839765}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2736175364707303, "4": 0.2561418209016883, "2": 0.1642988751960139, "1": 0.16408028963722704, "5": 0.14175907744669386}, "score": 3.0472053551693876}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3289572091663161, "2": 0.31377883135283013, "1": 0.22508364281806995, "4": 0.11065546762655731, "5": 0.021424636088716555}, "score": 2.3894974425542763}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8325717705271966, "4": 0.13501059798936904, "3": 0.027889240770423172, "1": 0.0023614722965277636, "2": 0.0021321231749086835}, "score": 4.793361471721438}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3751254783678099, "3": 0.3211906201043028, "5": 0.18173647150034603, "2": 0.08573381132258595, "1": 0.03617101035137679}, "score": 3.580547325508877}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.46527865258691486, "4": 0.416090218849451, "3": 0.10367363905162452, "2": 0.010872963325068877, "1": 0.0040204155944128}, "score": 4.327818856763064}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6819425378774568, "4": 0.23211531114437484, "3": 0.06770599842234994, "2": 0.010330488577690347, "1": 0.007841981768249472}, "score": 4.570085921326269}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"1": 0.30220173135212464, "2": 0.29210559949045367, "3": 0.21560958146553513, "4": 0.14730158429566623, "5": 0.04274327097851603}, "score": 2.3362536874317232}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5596721013769115, "4": 0.30902308380627047, "3": 0.09851402058195993, "1": 0.018081788634715372, "2": 0.014661470215513667}, "score": 4.377607724188187}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.42956801136532136, "4": 0.32015039795224415, "3": 0.15728019228801593, "2": 0.047315407337626535, "1": 0.04550651392888126}, "score": 4.041144847174407}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8229914888290804, "4": 0.15004578471892893, "3": 0.023375923419736832, "1": 0.001909881654190646, "2": 0.001644669215150496}, "score": 4.79062208128864}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6543713992181135, "2": 0.24663980155458212, "3": 0.07142993069973734, "4": 0.02115596669579412, "5": 0.006374808038492695}, "score": 1.4784802375202917}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.34336059042169453, "2": 0.263008717754032, "1": 0.19277615149923566, "4": 0.12992391098459957, "5": 0.07085944584471218}, "score": 2.62305494965514}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8441826481823306, "4": 0.10597327916473237, "3": 0.03496427685527495, "1": 0.009164554570657681, "2": 0.005624298779976693}, "score": 4.770546185410778}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7214112615117594, "4": 0.16950997573494053, "3": 0.08463702164462175, "2": 0.012933126673522956, "1": 0.011434187589347654}, "score": 4.576648341869275}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8828921820209784, "4": 0.0898740529868051, "3": 0.02136259678388913, "1": 0.0035529643349633596, "2": 0.0022670020572053743}, "score": 4.846380024312194}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3037346866254616, "4": 0.2744082274943261, "3": 0.20195192600082393, "1": 0.12116737799907815, "2": 0.09860971429153716}, "score": 3.5410024153304076}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3203022813022821, "3": 0.2201898830759357, "2": 0.21078782924734613, "4": 0.15626224897472363, "5": 0.0921381958680311}, "score": 2.4889829474668526}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2512570902767659, "1": 0.24253935332943385, "4": 0.20294588740142253, "2": 0.1976764056768937, "5": 0.10510055714700597}, "score": 2.730262224747238}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2765804339393213, "1": 0.2640251540189228, "2": 0.21436453040831574, "4": 0.1327984385387858, "5": 0.11208203729145129}, "score": 2.6144900772558772}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6972652368043525, "4": 0.21051661454911721, "3": 0.06836337848491023, "2": 0.012276787435203418, "1": 0.011423227459671635}, "score": 4.570166837391031}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.39864399638961484, "4": 0.26889306669308344, "3": 0.20719558018039946, "2": 0.0659306596894477, "1": 0.058874954468774686}, "score": 3.8829081671391488}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.33366018970398487, "4": 0.22471110040718145, "2": 0.2168358203603778, "1": 0.1395124547979997, "5": 0.08509068575334118}, "score": 2.8990125796977826}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6501337292147494, "4": 0.2330705456994791, "3": 0.08996181288238278, "2": 0.016516952521013314, "1": 0.01023130644437436}, "score": 4.496486617643643}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4150607682305427, "4": 0.3572932520790467, "3": 0.16586264050543123, "2": 0.038686862765535755, "1": 0.02294640499141455}, "score": 4.10300064467363}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5731220403737549, "4": 0.3276169134428472, "3": 0.07902919798907744, "2": 0.012929487803690019, "1": 0.00723841296747874}, "score": 4.4465471834165555}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.373081830007954, "5": 0.26541737287868433, "3": 0.22732162819742813, "2": 0.08258474506124863, "1": 0.05141259487803092}, "score": 3.718637310034681}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3298160843611242, "1": 0.24471172349897571, "2": 0.23162831095864705, "4": 0.11324247078089529, "5": 0.08053744881983446}, "score": 2.5532370347985918}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7187277815316501, "4": 0.23538853256963818, "3": 0.039297168934178076, "2": 0.004096690607952827, "1": 0.0024563494367767923}, "score": 4.663890408077185}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32509396999458084, "4": 0.2727355867077018, "5": 0.24702192033409412, "2": 0.10107676513415731, "1": 0.05396542582356604}, "score": 3.557831125897171}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.48294850302965214, "4": 0.24831104623571057, "3": 0.1856432421583563, "2": 0.05079242244461045, "1": 0.03223443461013573}, "score": 4.099024078646269}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3204099850332386, "4": 0.2865958338946198, "2": 0.15303517225337418, "5": 0.12575993086990303, "1": 0.11415375628242466}, "score": 3.1567801163523397}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6180637818332424, "2": 0.18417227172786993, "3": 0.11280387360927985, "4": 0.05080184531291795, "5": 0.03407637670549958}, "score": 1.6985482384471542}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.34662114383433723, "1": 0.26999981639567827, "3": 0.19644721690817707, "4": 0.09398962266379708, "2": 0.09284678662698662}, "score": 3.154400222790752}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.35966112870299877, "5": 0.2497741923196379, "3": 0.20974407121369681, "2": 0.11663778511161911, "4": 0.06406661996939078}, "score": 2.7276233111891166}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5140121374961676, "2": 0.22874370370321706, "3": 0.1811545580886206, "4": 0.041751988503213655, "5": 0.03428455903759336}, "score": 1.8534923020136789}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.39276383755143596, "3": 0.1969538778980474, "2": 0.1766813767407673, "5": 0.12353560066010853, "4": 0.10988615540333077}, "score": 2.3946398535525257}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3077629916073448, "3": 0.3020170518867787, "5": 0.19359270221898717, "2": 0.12098097223588818, "1": 0.0755197475480042}, "score": 3.4229814504610334}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3723768499444889, "3": 0.32182550186602327, "5": 0.2008408651835551, "2": 0.08033807588413873, "1": 0.024466846057652855}, "score": 3.644884745195809}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.30829027146645416, "3": 0.305343776820639, "1": 0.24050738092269283, "4": 0.10880288808649141, "5": 0.03699255510360977}, "score": 2.393444674599843}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4634693840441766, "4": 0.3986510524507969, "3": 0.11204008163127903, "2": 0.017535997689045252, "1": 0.008215086483809446}, "score": 4.2917378365373935}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3271849734408156, "4": 0.325060129473734, "2": 0.14873568120447786, "5": 0.11411229175525468, "1": 0.08476596270125597}, "score": 3.235050239393819}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.38101704779031026, "3": 0.2703593713461365, "5": 0.21998137396707038, "2": 0.07927559127936877, "1": 0.04925084766697367}, "score": 3.6432769799684777}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6599356557514051, "4": 0.2669179689992285, "3": 0.06132027134028342, "2": 0.0069687319532030275, "1": 0.004818673482002411}, "score": 4.570243967629994}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8832508326780434, "4": 0.10354072141833107, "3": 0.012255276500454455, "2": 0.0004968975450000605, "1": 0.0004236851285315603}, "score": 4.868759015717161}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6759714213109966, "4": 0.26222572508838876, "3": 0.05282452539486392, "2": 0.005427228394135843, "1": 0.0035122117912567276}, "score": 4.601779205756095}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6260579626974364, "4": 0.2860251313985221, "3": 0.07275567275185411, "2": 0.008587273477049321, "1": 0.006532653911233415}, "score": 4.516551117796299}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"1": 0.27254103201839636, "3": 0.22823052186363496, "4": 0.2110746957201083, "5": 0.149126968248854, "2": 0.13885296659378313}, "score": 2.825363247003056}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5572898652609775, "4": 0.32207230788441377, "3": 0.09379259224710706, "1": 0.014638049649298004, "2": 0.011937566529965395}, "score": 4.395814709946014}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3696714650819979, "3": 0.3123413558466569, "5": 0.14551565553211362, "2": 0.10550698708132558, "1": 0.0667404542112212}, "score": 3.421809400640625}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.504394928228707, "4": 0.33682461983938605, "3": 0.1166027990242611, "2": 0.02094472194823947, "1": 0.020867643031330492}, "score": 4.2834032800109405}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.319988506826677, "5": 0.31160154709333615, "3": 0.19134337311133479, "1": 0.10771682349592909, "2": 0.06918864634350924}, "score": 3.6586754223496585}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4002330005849113, "3": 0.23063061905915816, "5": 0.13864487100437578, "2": 0.1152826892014573, "1": 0.11505160639692734}, "score": 3.3321890652880666}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7210958573352498, "4": 0.24725200482963883, "3": 0.027681969453140977, "2": 0.002158156271069381, "1": 0.001737676331359703}, "score": 4.683935387216056}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6754218097142415, "4": 0.2755058545444212, "3": 0.042993041584487426, "2": 0.0035745678187645616, "1": 0.002399448163359929}, "score": 4.6181463653232}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.794331959575933, "4": 0.18361948113956306, "3": 0.018563084030344207, "1": 0.0017003305595979096, "2": 0.001665431549907162}, "score": 4.767428892092951}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3166377509545597, "3": 0.22240930020756006, "5": 0.21718716188776413, "1": 0.12727828108917466, "2": 0.11641701236800547}, "score": 3.380065292313733}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3134989086799217, "4": 0.25972775310622526, "3": 0.23858474662693593, "1": 0.10508051638170578, "2": 0.0827730296100063}, "score": 3.59399052200064}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.45863414796613994, "4": 0.2939611979839394, "3": 0.166378976787176, "2": 0.04118011437276992, "1": 0.039719779149675144}, "score": 4.09074701948393}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5009353841337681, "4": 0.3041695508475609, "3": 0.14321548425913921, "2": 0.029297356173989396, "1": 0.022167001828944204}, "score": 4.232674258835193}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.23403846424909303, "4": 0.2261746930966405, "5": 0.19854025568405886, "3": 0.1978586682260478, "2": 0.14322538079102273}, "score": 3.011954838290495}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28059489630106066, "2": 0.223403617399615, "1": 0.20868275476695813, "4": 0.20391123548535492, "5": 0.082838081651164}, "score": 2.728663769098161}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3408165237569595, "2": 0.2330687976769414, "1": 0.17241360647464818, "4": 0.17167330462768512, "5": 0.08190446269886392}, "score": 2.7575563249388195}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.899691654924492, "4": 0.08163207649107586, "3": 0.016763449293529055, "2": 0.0010065428907820204, "1": 0.0008460450070080495}, "score": 4.878429893884636}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.41294779432654904, "3": 0.2534130785889952, "4": 0.24892102537356828, "2": 0.05122988632234558, "1": 0.03333795637596339}, "score": 3.957054621034734}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.734921932276695, "4": 0.22108063052483407, "3": 0.03857916172375296, "2": 0.003388311040104474, "1": 0.001955972043814548}, "score": 4.6837488245515235}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.867205366507551, "4": 0.11813585537925715, "3": 0.012776131185528493, "1": 0.0009393807278161646, "2": 0.00088128736917435}, "score": 4.849901194282435}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4183096630649762, "5": 0.2575819131870918, "3": 0.2521915906450262, "2": 0.04833196673875433, "1": 0.02343475036251063}, "score": 3.8383978789127515}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.37714573546931407, "4": 0.2956408221953332, "2": 0.1271455227603749, "5": 0.11602462800761083, "1": 0.0838464105181104}, "score": 3.2328975875353625}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6485505559343506, "4": 0.24671385393771536, "3": 0.08918765016914092, "2": 0.008665159054593011, "1": 0.0067281261936471635}, "score": 4.521928927842348}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7391003319973614, "4": 0.21893230643157505, "3": 0.036080879777786845, "2": 0.0032759774382372367, "1": 0.002458409457846834}, "score": 4.689197092330463}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4309874101904679, "4": 0.378410134370498, "3": 0.14654016855777874, "2": 0.02633601987018971, "1": 0.017508876466350885}, "score": 4.179287547910958}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31986181646432105, "2": 0.2767085756716561, "4": 0.19622025513461105, "1": 0.16079366818042046, "5": 0.04629964894963547}, "score": 2.6904877265592284}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9524542763171621, "4": 0.04239163177585597, "3": 0.004557064558110971, "1": 0.0003059374159404544, "2": 0.0002762918012050897}, "score": 4.946440821464766}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.38066100141214376, "4": 0.3253147837579961, "3": 0.22224691176616654, "2": 0.04116246424131431, "1": 0.030575464664307984}, "score": 3.984362151443304}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9238313552146373, "4": 0.06771549146877576, "3": 0.007646066090076357, "2": 0.00039978142408357017, "1": 0.00039231377183466826}, "score": 4.914222491012442}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2785460731733196, "2": 0.2393548979035383, "4": 0.21341720929430127, "1": 0.20425758705659422, "5": 0.06436671675784172}, "score": 2.6942629860799086}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"2": 0.37469628043994274, "1": 0.3714585707074836, "3": 0.2039828412897972, "4": 0.037748078697982544, "5": 0.012038529272616125}, "score": 1.9441317865951564}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8736561777731795, "4": 0.11155465821371446, "3": 0.012985608152009467, "2": 0.0009619189138387556, "1": 0.0007682467402865803}, "score": 4.856504850640894}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7095663998069348, "4": 0.19561238605435266, "3": 0.07755231795447708, "2": 0.008987150895745923, "1": 0.008158989120270188}, "score": 4.589635194057225}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7024028915487999, "4": 0.24437452303972804, "3": 0.04662590458124645, "2": 0.004370748513449243, "1": 0.002123237356729692}, "score": 4.640731577774247}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.849579600069813, "4": 0.12696703412976867, "3": 0.020102365183879523, "2": 0.0017495873829830558, "1": 0.0015406693717685822}, "score": 4.821405947374001}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2963344689252453, "3": 0.28244845647452665, "5": 0.20056118834801437, "2": 0.12179089258794577, "1": 0.09873260920760932}, "score": 3.3782508091459595}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8392473254168942, "4": 0.130721535690645, "3": 0.02675822704073914, "2": 0.0017333829802866248, "1": 0.0014760666470431312}, "score": 4.804645197048503}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4135091651299247, "4": 0.3995640624743074, "3": 0.157018946903684, "2": 0.020546608256651416, "1": 0.009219190901336912}, "score": 4.187766096739314}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9563640528493859, "4": 0.039727493479823225, "3": 0.0032978039557049173, "1": 0.0002943246936078385, "2": 0.00018918371083600474}, "score": 4.951925936502387}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.535506098894746, "4": 0.3325115442300711, "3": 0.09916321004114714, "2": 0.01741047922036279, "1": 0.015245589970686984}, "score": 4.355843190569602}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3647928575711811, "4": 0.25714110450250854, "2": 0.20511128366204612, "1": 0.09817010889785288, "5": 0.07458522855685229}, "score": 3.0048610295294615}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.41082573780735343, "5": 0.38211307741642186, "3": 0.1781195010026195, "2": 0.02098715699524374, "1": 0.00791020168544356}, "score": 4.138294787296281}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4718469237909337, "4": 0.30609349024994037, "3": 0.18816015321345836, "2": 0.022514960041057432, "1": 0.01131672000954776}, "score": 4.204720560836448}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.49021833768974377, "4": 0.30289853425498203, "3": 0.16497168926751518, "2": 0.027744140895043616, "1": 0.014075902306181935}, "score": 4.227551456912466}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4036902915851915, "5": 0.27989274577476436, "3": 0.2486949833171679, "2": 0.04849966443153781, "1": 0.01916120915753175}, "score": 3.8767072722293223}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7395317598637213, "2": 0.16805408783421, "3": 0.06499137566282073, "4": 0.020585418368856537, "5": 0.006756238356131737}, "score": 1.3868494288834503}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.45262912383823806, "2": 0.3330292350208017, "3": 0.16291338496351637, "4": 0.038173451190640764, "5": 0.013200094372282863}, "score": 1.8262219391189074}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3289666174770365, "3": 0.29687419968344436, "5": 0.2385282803004627, "2": 0.08332409632763817, "1": 0.05215114196897191}, "score": 3.6184930750683693}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3192598598914402, "3": 0.29018808420664244, "5": 0.17023848024516824, "2": 0.1256050272340804, "1": 0.09457557770965684}, "score": 3.3450265161502437}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29218065105892393, "4": 0.2715352265887044, "5": 0.15897528962547594, "1": 0.1394888512875612, "2": 0.1376850704455808}, "score": 3.172846351692027}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2872990843754665, "2": 0.2436527799874667, "4": 0.22730219302908256, "1": 0.18679296770777787, "5": 0.054828332621266636}, "score": 2.7196852037935733}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5559833451201963, "4": 0.3557315875723306, "3": 0.07104894309925393, "2": 0.010171600567869888, "1": 0.006988178802219234}, "score": 4.4436605356703245}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3173171919044227, "2": 0.25552945301343766, "1": 0.21072348554564274, "4": 0.145796378286608, "5": 0.07056656007646243}, "score": 2.6099269662889415}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8677152336334446, "4": 0.11970821965246348, "3": 0.011095147815204792, "2": 0.0007754554684607424, "1": 0.000598544908915102}, "score": 4.853365190314322}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.39397372883147075, "4": 0.3290034638015495, "3": 0.16539389625595288, "2": 0.056383636249293684, "1": 0.05517235314434995}, "score": 3.9502918758420993}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31544649479122444, "4": 0.22922775645778212, "2": 0.1616662425691197, "1": 0.15350164429388166, "5": 0.13993956893849815}, "score": 3.040446192296507}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5571697655193313, "4": 0.32376734244674443, "3": 0.08818177235224708, "1": 0.01650285306488504, "2": 0.01432636690487413}, "score": 4.390846985008606}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2903612620715006, "4": 0.2748251779539747, "5": 0.20504067600288728, "2": 0.1207366682997854, "1": 0.10889398333702163}, "score": 3.3464311686999024}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.86640658752014, "4": 0.1126116618287974, "3": 0.017120135390092772, "1": 0.0019798157384402233, "2": 0.0018196356322445055}, "score": 4.839759936394789}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6200961390376915, "4": 0.2856072110674057, "3": 0.06573697016226823, "1": 0.015321798898346135, "2": 0.013150401348837102}, "score": 4.482135146417237}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.34385841177981114, "3": 0.25713606458625166, "5": 0.1927789660515937, "2": 0.12406616090274696, "1": 0.08206907567874137}, "score": 3.4412523272269206}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.43955611096764885, "4": 0.39615869621025396, "3": 0.12997837350751767, "2": 0.02316791341622175, "1": 0.011081790646784304}, "score": 4.230009675747829}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6127950550645185, "4": 0.30164655339555757, "3": 0.0720134191679169, "2": 0.00865181632770135, "1": 0.004842234457573908}, "score": 4.508977217796017}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8921552450586756, "4": 0.09908854843243571, "3": 0.008081077996013208, "2": 0.00040052394719398363, "1": 0.00024222463949515524}, "score": 4.882575022963886}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4908547106332879, "4": 0.35291339220949625, "3": 0.12522031163101566, "2": 0.020488182960396624, "1": 0.010463460953257776}, "score": 4.293285230211341}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6846663908567957, "2": 0.23416705689224115, "3": 0.05281333306380213, "4": 0.018058019486341417, "5": 0.010256250032059733}, "score": 1.4350097250918081}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.47100319572969523, "4": 0.24502111217675404, "3": 0.18351862830343588, "2": 0.06022600157905874, "1": 0.0400804618126581}, "score": 4.046798226661747}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.39505151692119395, "4": 0.2659829154219919, "3": 0.2494801814529112, "2": 0.05911292389797518, "1": 0.030184787701604755}, "score": 3.9367792596400863}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8489919028461131, "4": 0.11985906317215958, "3": 0.024399242310829173, "1": 0.003523205677415584, "2": 0.003124168847405482}, "score": 4.807857444262106}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9067819642436215, "4": 0.07507910409551359, "3": 0.014087722578852135, "1": 0.0021644348302286075, "2": 0.0018187860607946202}, "score": 4.8826233730189506}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.27272391387439116, "3": 0.2366025144651566, "5": 0.18917102101085992, "1": 0.157449296426029, "2": 0.1437576188519425}, "score": 3.1924666441399756}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8693957750978866, "4": 0.10543207207761497, "3": 0.02003765150504132, "1": 0.003143080214050531, "2": 0.0019517917151280278}, "score": 4.836058432006336}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7775562113389743, "4": 0.1715943702272435, "3": 0.039321273347826445, "1": 0.0059573710155124545, "2": 0.005381174069958626}, "score": 4.709735042569108}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8111566880613071, "4": 0.16276007419394284, "3": 0.022102556464982187, "2": 0.002163997658548726, "1": 0.0016817489254605741}, "score": 4.7797861097043155}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6978394130171371, "4": 0.2092502238165463, "3": 0.06369477148952646, "1": 0.015371706494131157, "2": 0.013714398673419902}, "score": 4.5606733243299695}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6386602539231444, "2": 0.2695709117142404, "3": 0.0688673836388351, "4": 0.016650778614757014, "5": 0.006118344656552177}, "score": 1.4817951481869627}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4309319456799942, "5": 0.3345977215254395, "3": 0.1799055838274694, "2": 0.03528666318106421, "1": 0.019186672146975767}, "score": 4.026561222952962}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5644877478819854, "4": 0.3168585877692934, "3": 0.09600314765297448, "2": 0.013808236735233187, "1": 0.008784035085254296}, "score": 4.414540166343062}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5324026366968616, "4": 0.332386443675123, "3": 0.10689094177947453, "2": 0.01622184481028621, "1": 0.012055303396210046}, "score": 4.356917381751884}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30454171687027043, "2": 0.23754811180550836, "4": 0.2219079328545675, "1": 0.16910289553721275, "5": 0.06680763557211976}, "score": 2.779749102490454}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"4": 0.40168758268763427, "3": 0.23744157162130242, "5": 0.21289363589302884, "2": 0.08041753737730221, "1": 0.06749680605006425}, "score": 3.6121021856391504}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4426857405279927, "5": 0.25085008229182637, "3": 0.23259124019252853, "2": 0.0487793505568843, "1": 0.024953908892945312}, "score": 3.8458168783878923}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3688671230237124, "5": 0.28673589883413897, "3": 0.2758932675038239, "2": 0.046109466637810806, "1": 0.022300272073167936}, "score": 3.8517089466390972}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.471103793913667, "5": 0.2798367168557422, "3": 0.20519305731612036, "2": 0.02973383666537156, "1": 0.014064062416723448}, "score": 3.9729819473350343}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4345249993623752, "3": 0.25772168928583455, "5": 0.2063707232819122, "2": 0.06342662201977427, "1": 0.03788698612009987}, "score": 3.7081146973684853}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"1": 0.40666480817291084, "2": 0.2675838777805107, "3": 0.16551749165358984, "4": 0.11908119590674474, "5": 0.04081456810117212}, "score": 2.119499177296579}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6084598321442707, "4": 0.3012496668710875, "3": 0.07591852903999106, "2": 0.008184951448025736, "1": 0.006048088544002614}, "score": 4.498096336072785}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.564676069821756, "4": 0.28923684315797604, "3": 0.12051688637227971, "2": 0.01594756700911438, "1": 0.009508605959244203}, "score": 4.383781993323698}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5504170034192335, "4": 0.3299906362249831, "3": 0.0960999964448661, "2": 0.013897957390048158, "1": 0.009515222446496935}, "score": 4.3980069406659705}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5272788200740002, "4": 0.3335408941514629, "3": 0.1096026857226231, "2": 0.016987673264972667, "1": 0.012457685964565078}, "score": 4.346373534648809}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5110504835593426, "2": 0.34207587835266845, "3": 0.10980193797685892, "4": 0.03008570009541668, "5": 0.006912686032627347}, "score": 1.6796374256498743}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.39688937084007764, "5": 0.273230286249803, "3": 0.2725474095531625, "2": 0.0462686524550686, "1": 0.010999941768175562}, "score": 3.875137712950594}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3635521958072124, "3": 0.33855459992719056, "5": 0.13120810873491323, "2": 0.1127407887688578, "1": 0.05382993790224688}, "score": 3.405614138330117}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.39003861185604616, "5": 0.35635419962170384, "3": 0.18690107739200917, "2": 0.04143338177446303, "1": 0.025180132204561324}, "score": 4.011046984986423}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.29092732071448907, "3": 0.28868642919980303, "5": 0.22149685239593828, "2": 0.11873433031694136, "1": 0.08004355139488482}, "score": 3.455150348935927}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3114581499066035, "4": 0.2796481424910402, "3": 0.2521687683387978, "2": 0.09674045580002916, "1": 0.05989247546690686}, "score": 3.6861021624558505}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9622106561514961, "4": 0.032472506549146525, "3": 0.004586732876343165, "1": 0.0004136540340701818, "2": 0.0002719093008590717}, "score": 4.955881718583051}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5170907748010889, "4": 0.24345869043234927, "3": 0.17040822448408552, "2": 0.039603776464639744, "1": 0.029354218858167413}, "score": 4.179427469233054}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.966554164500255, "4": 0.028652201430856068, "3": 0.004130875124101856, "1": 0.0003434498342182304, "2": 0.00026591283256794404}, "score": 4.960912423355254}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.841905924166812, "4": 0.12880128353856604, "3": 0.023345850953814157, "1": 0.003196790312144375, "2": 0.0027011491105833753}, "score": 4.803606782329114}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4074653013451274, "5": 0.3116669591228234, "3": 0.20019673918917952, "2": 0.04902346587976293, "1": 0.03146028884666009}, "score": 3.9190272598434914}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.35874939439761605, "3": 0.3033247697898194, "5": 0.1629698768263818, "2": 0.10789499428099417, "1": 0.06696669317404458}, "score": 3.442902520520053}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4296337402991955, "2": 0.26867747403928144, "4": 0.1527783195619958, "1": 0.11612192062044453, "5": 0.032749257136928944}, "score": 2.7173444134862885}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8125883111812773, "4": 0.15056478835766338, "3": 0.031424884497807844, "1": 0.0027123593879581406, "2": 0.0026905947853877177}, "score": 4.767659791918492}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.35892138419641345, "3": 0.31052756667110487, "5": 0.1370479656768781, "2": 0.12063360320011887, "1": 0.07280450091027757}, "score": 3.366798544858763}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32476903851740246, "2": 0.2661057214772076, "1": 0.24670489838736165, "4": 0.11231812861889458, "5": 0.050025635247113155}, "score": 2.452811978432566}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6313055009250486, "4": 0.2538454910519451, "3": 0.09202937126527783, "2": 0.013127342634410252, "1": 0.00962727945840565}, "score": 4.484171084236535}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3483281095050521, "2": 0.2213901387774802, "1": 0.17939151984715768, "4": 0.16031186574361275, "5": 0.09049927856187678}, "score": 2.761118351827737}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8656982606030335, "4": 0.11040598882579217, "3": 0.021229611563911385, "2": 0.0015571921240573182, "1": 0.0010609775275686503}, "score": 4.838211540675795}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.37519605736286027, "5": 0.3045653806809984, "3": 0.19114405892853975, "2": 0.0698306607432584, "1": 0.059155754898128715}, "score": 3.796270715005645}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2890529470109011, "3": 0.2554895679789302, "5": 0.19059919714913484, "2": 0.13442518231892234, "1": 0.13031992372220774}, "score": 3.2752174611589564}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.38460755585946055, "4": 0.3403659897082489, "3": 0.17928468814176737, "2": 0.05083415539645503, "1": 0.044728727965654455}, "score": 3.9694629104638186}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3391652931575588, "4": 0.25750416094479217, "3": 0.20665366559525147, "1": 0.10230837932946618, "2": 0.09427139271511599}, "score": 3.6370084546671078}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5163835374353977, "4": 0.24842981697384067, "3": 0.15073606280806026, "2": 0.04246900343857334, "1": 0.041845366710151335}, "score": 4.155194507072323}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3601310449568111, "5": 0.298120950696848, "3": 0.23352519644673614, "2": 0.0654477607729926, "1": 0.04265099823682759}, "score": 3.805723138164623}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.38885589261579245, "5": 0.3658987950775414, "3": 0.16490462541366444, "2": 0.04474720027077644, "1": 0.0355028252911976}, "score": 4.00499174580705}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5476916680086877, "4": 0.3040889565957963, "3": 0.12766748098721606, "2": 0.014416945405121093, "1": 0.00605644793556646}, "score": 4.373050237246427}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.81643566770024, "4": 0.13502450479715028, "3": 0.0424374522011099, "2": 0.0035996613765990676, "1": 0.0024766196325399174}, "score": 4.759388849562968}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3767211576799836, "5": 0.353646447780464, "3": 0.2042201909161253, "2": 0.04045852919416716, "1": 0.024892328882126055}, "score": 3.993831833440074}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2816941981946634, "4": 0.22199762397110356, "2": 0.19993139425638184, "1": 0.19908850587306967, "5": 0.09720340862229589}, "score": 2.8182806128555176}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8670945620852639, "2": 0.10516683342631984, "3": 0.020272357913496335, "4": 0.004514461808470019, "5": 0.0028987162859784605}, "score": 1.1708588670430855}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5875491364209297, "2": 0.2647336904464237, "3": 0.11244369179680751, "4": 0.02707025649910016, "5": 0.008088204606858952}, "score": 1.6032540483840962}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.49413402150297686, "2": 0.31520337927681435, "3": 0.14899238227720218, "4": 0.030069557432446565, "5": 0.011497369602420319}, "score": 1.7494637065756462}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2838262567604517, "1": 0.21727331539928085, "2": 0.2021019511985337, "4": 0.18727845603249135, "5": 0.10931649284352127}, "score": 2.769215888747911}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.38628837614130074, "2": 0.29912743271981285, "3": 0.2091263425188748, "4": 0.07390378754802482, "5": 0.031433889017052255}, "score": 2.0649550143023276}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.37407081296928396, "5": 0.3382872474113964, "3": 0.22062075329523773, "2": 0.04154459709294314, "1": 0.025292400597742185}, "score": 3.958692489763186}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.48837361087149656, "4": 0.3684377904211385, "3": 0.11918995476591607, "2": 0.01677234298543293, "1": 0.007126198189632054}, "score": 4.314291837048159}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.53450513577703, "4": 0.3224977240437159, "3": 0.12010177147559803, "2": 0.014961988412413129, "1": 0.007829087615270493}, "score": 4.361029777392385}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.45585408942645905, "5": 0.37874544826990497, "3": 0.1362634683566661, "2": 0.020581379905958732, "1": 0.00841408492977801}, "score": 4.176101888855803}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.43269620599542, "5": 0.344327307046774, "3": 0.1796134926180786, "2": 0.031340816168607885, "1": 0.011970515432261715}, "score": 4.066124051944322}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4091822185613391, "3": 0.2264274713792179, "5": 0.21006846029223095, "2": 0.08885701270802737, "1": 0.06527158388290362}, "score": 3.6100368502309226}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6925759997576111, "4": 0.2433587711497627, "3": 0.05228064776503431, "2": 0.006319071475819023, "1": 0.005348470750299927}, "score": 4.611683387664116}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.41163531886240123, "5": 0.2953299420534766, "3": 0.18969193830851358, "2": 0.056039358766715716, "1": 0.04715145553837697}, "score": 3.852082438128244}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7563261125554519, "4": 0.20474696076453108, "3": 0.03337738847594638, "2": 0.0030148596514077324, "1": 0.002380564344188939}, "score": 4.709886715373369}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5268126481525691, "4": 0.34514702269118136, "3": 0.10439055259639246, "2": 0.014554879219975269, "1": 0.008945768068755409}, "score": 4.366529693215956}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3108852829384702, "2": 0.22162440484631257, "3": 0.21565221169365004, "4": 0.1740465825138839, "5": 0.0775753776862642}, "score": 2.4856912042947465}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.36223507480377004, "5": 0.3068753929332365, "3": 0.1951042788539046, "2": 0.06856045281922088, "1": 0.06695539015023885}, "score": 3.773723076624769}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4085559784177543, "3": 0.25281790309805685, "5": 0.23697915388658833, "2": 0.06172155854146623, "1": 0.03970862740146865}, "score": 3.7415362220711343}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3945891823446048, "5": 0.39044533761497685, "3": 0.15645906010460828, "2": 0.034417906921443336, "1": 0.023915779685949334}, "score": 4.093419261229565}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4068047045909893, "4": 0.3654337042373014, "3": 0.1655365272596564, "2": 0.03644513499792246, "1": 0.025684990112892638}, "score": 4.09133160791018}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3095307927141018, "3": 0.2557827570615867, "2": 0.15065801681288687, "5": 0.1468800370299151, "1": 0.1370143519337917}, "score": 3.1786280901971593}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6207170419016088, "4": 0.27960944186626446, "3": 0.081661567322828, "2": 0.012270564681575113, "1": 0.005662951818554177}, "score": 4.497564514943593}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7267077694525156, "4": 0.21244462772183492, "3": 0.0552429250598043, "2": 0.003671059376950167, "1": 0.0018424212051470785}, "score": 4.658655529552725}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9349401382547295, "4": 0.05863483529856855, "3": 0.005826423102074698, "2": 0.0002740415008744871, "1": 0.00024949841387683045}, "score": 4.927886787274065}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7691147045012687, "4": 0.17522254977512133, "3": 0.04417688457999498, "2": 0.006281769315787848, "1": 0.005045752897189982}, "score": 4.697347439846036}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3172954881507733, "5": 0.28130989166261516, "3": 0.26451632747628406, "2": 0.07802729325284367, "1": 0.05872915484894506}, "score": 3.684513072752659}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.41231650852121765, "4": 0.3503218414580643, "3": 0.15056784485389038, "1": 0.04443626338462419, "2": 0.04231242926666089}, "score": 4.04381699167485}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5679519834579214, "4": 0.31221619451523985, "3": 0.1048623543261359, "2": 0.009510831233385586, "1": 0.005427693527539901}, "score": 4.4277981234139645}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5111567215537876, "4": 0.27345379802520486, "3": 0.12971974024154062, "1": 0.04540314060526426, "2": 0.040131227784225655}, "score": 4.164987438572886}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3048722934677541, "5": 0.2886858229589383, "3": 0.20298572958950223, "1": 0.10855844363588808, "2": 0.0947468766195886}, "score": 3.5704662210412716}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7698426235683746, "2": 0.15962261595927668, "3": 0.050032324121686976, "4": 0.014654101746656144, "5": 0.0056043567087955635}, "score": 1.3261465688311946}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6860415943027334, "4": 0.2263555241618319, "3": 0.07710603704397337, "2": 0.0067184184624193115, "1": 0.003686864172426964}, "score": 4.58449164495683}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3246710704777036, "5": 0.2828738331510753, "3": 0.27769052633428726, "2": 0.07648099502955082, "1": 0.03819491833875005}, "score": 3.737613299410668}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.31899335727609995, "4": 0.2582473841944498, "3": 0.23075087814368067, "2": 0.09664496208843754, "1": 0.09521416083308974}, "score": 3.609251750363377}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.25621216710379935, "3": 0.22952782844307087, "2": 0.21996228041248228, "4": 0.18438824816780697, "5": 0.10973174208505138}, "score": 2.6714067155887484}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5309805220772945, "4": 0.24810582751179394, "3": 0.18330500858264365, "2": 0.02341681324226091, "1": 0.014113008757828635}, "score": 4.258523237493803}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.397335129293973, "3": 0.26203806487278697, "5": 0.24526824250505222, "2": 0.06575256482104413, "1": 0.029449530832386935}, "score": 3.7633394257632586}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6937752209914738, "4": 0.25920531741398317, "3": 0.04495446906414879, "2": 0.0013635223011501877, "1": 0.0006451225236894615}, "score": 4.644194638643775}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.833825609339125, "4": 0.14029538306585093, "3": 0.02372610880159324, "2": 0.001184246703242558, "1": 0.000933135628047108}, "score": 4.804960189585004}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9552633761299612, "4": 0.040450612234703615, "3": 0.00380851473188322, "1": 0.00025434269687584936, "2": 0.00016869385410311688}, "score": 4.950406205056163}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.367931131864113, "2": 0.24522355870208587, "3": 0.22313765744776476, "4": 0.12546144233578743, "5": 0.03811192704643187}, "score": 2.2204948000103957}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8759453200747048, "4": 0.10447975065397315, "3": 0.017577236407869744, "2": 0.0012791987162524866, "1": 0.0006528324804244388}, "score": 4.853907257766872}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7337359325623279, "4": 0.1897742445222789, "3": 0.06438788401401793, "2": 0.007204017661841, "1": 0.004817693463487433}, "score": 4.640538321799197}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4169654976728805, "5": 0.3920915188447634, "3": 0.15011028825801873, "2": 0.02538174662783971, "1": 0.015325108764360837}, "score": 4.1452606906189065}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.29667877237445606, "3": 0.29570424395343453, "2": 0.14459713250306294, "1": 0.13279460071936877, "5": 0.13004617490698014}, "score": 3.146611042698652}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4262977385744357, "2": 0.21623547566082696, "4": 0.19551348987873057, "1": 0.09290881041853512, "5": 0.06892804118092277}, "score": 2.9313084770072924}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5736528824476133, "4": 0.33150933827311285, "3": 0.07736068292449229, "2": 0.011142206434019438, "1": 0.006181825888104734}, "score": 4.455532034560982}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3976955962002115, "3": 0.2794298225567862, "5": 0.21591920331548375, "2": 0.07436052915722732, "1": 0.03246731136372457}, "score": 3.690326893448176}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9074231768820008, "4": 0.0844408660212513, "3": 0.0074894066765844565, "2": 0.00038257015873038766, "1": 0.00020975235185959225}, "score": 4.898588101386682}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.401606213042874, "4": 0.33827280285432537, "3": 0.1757411509099923, "2": 0.048636524374193614, "1": 0.03564777665447671}, "score": 4.021650751764235}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.39337797927522444, "5": 0.2571224367359698, "3": 0.21711678293412176, "2": 0.07606514004089368, "1": 0.056112274140576734}, "score": 3.7194809363649735}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6378461748236408, "4": 0.29362630252428756, "3": 0.05756557765941333, "2": 0.00625928698823599, "1": 0.004631950153979609}, "score": 4.553905338181628}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4404336540702497, "3": 0.2682184013329221, "5": 0.23132854643537712, "2": 0.0429013922583577, "1": 0.017060149052482508}, "score": 3.8261168530970378}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8910527322869658, "4": 0.10228676385266945, "3": 0.005886439283691143, "2": 0.0003301701269944956, "1": 0.00032540109438039636}, "score": 4.883634454277489}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5085303397915362, "5": 0.32698443781407704, "3": 0.13303028099774628, "2": 0.020648539261892945, "1": 0.010648315162989603}, "score": 4.12073121883636}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.39518969059492004, "3": 0.2988179362244863, "2": 0.12263205863262117, "5": 0.11671006460575745, "1": 0.0663991382995747}, "score": 3.373273217825546}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9104985066123037, "4": 0.07985507098105397, "3": 0.008348156023634456, "1": 0.0006862064692083906, "2": 0.0005482636355123477}, "score": 4.899052560117339}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9233899062859678, "4": 0.06396972848119645, "3": 0.011488715341847727, "1": 0.0005802636434682418, "2": 0.0005332839161053142}, "score": 4.909128472095847}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9754317241389032, "4": 0.023405926955361117, "3": 0.0010433808719154342, "1": 4.413193005375757e-05, "2": 0}, "score": 4.97432886245268}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9082998042377273, "4": 0.0832966788793253, "3": 0.0074870830742182655, "1": 0.0004234271828407198, "2": 0.00037189563281630746}, "score": 4.898907515931289}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3081861177814817, "5": 0.28099871011415845, "3": 0.27086129925215147, "2": 0.08627788249573531, "1": 0.05353091186866525}, "score": 3.676942041504448}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6227763708073447, "4": 0.18940392028536351, "3": 0.12283303313159523, "1": 0.033484872811491394, "2": 0.031414695060071836}, "score": 4.33668865736442}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5107169020639729, "4": 0.28126302933840414, "3": 0.1566841474033995, "2": 0.028319915327762003, "1": 0.022939682679618836}, "score": 4.228591322784432}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.41298570467412654, "4": 0.2926804147179928, "3": 0.18021579230414325, "2": 0.0642043893940214, "1": 0.04973211388101178}, "score": 3.9551566490577366}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6267784625820011, "4": 0.2502800470155966, "3": 0.08701023705073269, "2": 0.017994142332872783, "1": 0.017864710366156188}, "score": 4.45021840587347}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3110872063000073, "3": 0.24322133660198295, "2": 0.2195289861132018, "4": 0.14307437200041662, "5": 0.08276876690874686}, "score": 2.466738219513469}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2564430157170205, "5": 0.2564215010505548, "3": 0.21084049062422422, "1": 0.15107862232859245, "2": 0.12492099268912624}, "score": 3.342308890847198}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5210683269761964, "4": 0.2589259928516789, "3": 0.14721704272610162, "1": 0.04178116245499964, "2": 0.03080385606264362}, "score": 4.186938148905362}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5600796910113395, "4": 0.22422008212208996, "3": 0.11966161434637282, "1": 0.06005807309151401, "2": 0.035823685435341514}, "score": 4.188626073272583}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.24462829102730746, "4": 0.22454606579460082, "3": 0.22174808359875636, "1": 0.2011394158834097, "2": 0.107773335788906}, "score": 3.2037840655188123}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5490774020883081, "4": 0.27101836306787647, "3": 0.13561719564153465, "2": 0.024239532603518247, "1": 0.01998496576210405}, "score": 4.305045321743065}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4591939542019372, "5": 0.33190018594908755, "3": 0.1545877473268974, "2": 0.031117092895184426, "1": 0.022846706675870812}, "score": 4.046554627711737}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7236724254638849, "4": 0.21253074898074478, "3": 0.05397614981907084, "2": 0.004991243010192725, "1": 0.004776415066246378}, "score": 4.645418763018135}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9425550055845608, "4": 0.052092140277520904, "3": 0.004485979556824747, "1": 0.0004415670856880955, "2": 0.0003244617183388766}, "score": 4.936189812123079}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8161435094967034, "4": 0.15737122093932307, "3": 0.022295136911846015, "1": 0.00220773229748229, "2": 0.0019310800909204467}, "score": 4.78340321997042}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6215090727427192, "4": 0.27085203595412033, "3": 0.07498085235306896, "2": 0.018391291765695556, "1": 0.014194646393571346}, "score": 4.467195382834117}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6203782166989523, "4": 0.3033330506690682, "3": 0.06544090220705873, "2": 0.006968430213642164, "1": 0.0038243835044536826}, "score": 4.529556438002544}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3519111676021519, "4": 0.31491308464242457, "3": 0.2595379614959896, "2": 0.04848694948652601, "1": 0.025055480323246625}, "score": 3.920225259127308}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.724981696973449, "4": 0.24128299048207127, "3": 0.030920177953241444, "2": 0.0017817219404777, "1": 0.00098401482004903}, "score": 4.687579995639331}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7271391839848159, "4": 0.22326267185671825, "3": 0.04266963226223231, "2": 0.004547662110223056, "1": 0.0023331212863572214}, "score": 4.668406765695152}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6301322254197333, "2": 0.20862952658576026, "3": 0.11626830320307066, "4": 0.0300075278639204, "5": 0.01481542072170094}, "score": 1.59053720619917}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6097769465979601, "4": 0.265598343027659, "3": 0.09164348434704607, "2": 0.018287692250839444, "1": 0.014533548679619836}, "score": 4.438027509583931}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3487645242914245, "3": 0.23565257463462608, "4": 0.22906852142244036, "2": 0.10057761107618074, "1": 0.0857258898843958}, "score": 3.6547062427557346}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2990304713244165, "4": 0.27797102426120207, "5": 0.1741144739190278, "2": 0.14205795085787498, "1": 0.10670234963183176}, "score": 3.2707708244533578}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2487652744511228, "4": 0.24717188343924618, "5": 0.19402074357317975, "1": 0.163332627170637, "2": 0.14653250470737458}, "score": 3.162044287973119}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5469240141566348, "4": 0.27905069811356736, "3": 0.10891158202666469, "1": 0.038488445485205025, "2": 0.026408334972584786}, "score": 4.269788949763305}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7812221473180103, "4": 0.18147637482555118, "3": 0.03224611848622892, "2": 0.002562125734535676, "1": 0.002473653676641627}, "score": 4.736445235900334}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7386186842782528, "4": 0.2131030771601261, "3": 0.0437145491410839, "2": 0.0026738783365764253, "1": 0.0018100406054604326}, "score": 4.68418083408015}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8117570038085501, "4": 0.1529560735181041, "3": 0.029163014478706797, "2": 0.0030775843243649194, "1": 0.0029427854917556248}, "score": 4.767689949578431}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5428914972051855, "4": 0.3571373990349786, "3": 0.08094102305038117, "2": 0.0113059335291579, "1": 0.007541768314419608}, "score": 4.416789315715939}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"1": 0.352186681076278, "2": 0.2891714541002496, "3": 0.2333328276088112, "4": 0.09070211531746335, "5": 0.03437866879873605}, "score": 2.165724210628234}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.478322895953913, "4": 0.2946260658744042, "3": 0.15141078581416384, "2": 0.043955017392073664, "1": 0.03140952148585097}, "score": 4.144813437914909}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.40037082453204365, "5": 0.31837714766391473, "3": 0.21529248069523285, "2": 0.0438950202182157, "1": 0.021900373226477317}, "score": 3.949585231083775}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.400591345431106, "4": 0.3137058862547368, "3": 0.19316908220590973, "2": 0.05672887151784902, "1": 0.035683852622907866}, "score": 3.9869113790954382}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2515126481127799, "2": 0.23154438406722685, "4": 0.20701378370226475, "1": 0.20543257522041447, "5": 0.10436801710888034}, "score": 2.773311133085155}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"4": 0.389404472691235, "3": 0.2347754390980881, "5": 0.2006827451939621, "1": 0.08773269009235776, "2": 0.08726007079290386}, "score": 3.528120868942436}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3741835225189862, "3": 0.3190510683942444, "5": 0.18808385093046406, "2": 0.07714235482716833, "1": 0.0414708088687863}, "score": 3.5903076255866666}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3025006357078183, "5": 0.2800593875247147, "4": 0.2574026470689075, "2": 0.09724037238462004, "1": 0.06274958591224908}, "score": 3.594810054895259}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.3852467002638631, "4": 0.3346423933030379, "3": 0.18916475955369216, "2": 0.04850709029859792, "1": 0.04228943448066063}, "score": 3.972195296472858}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6387032052694436, "4": 0.2899398764738106, "3": 0.061657746770448704, "2": 0.005590340954644186, "1": 0.004044443561443881}, "score": 4.553767101291229}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.542960910320242, "4": 0.20791627590523162, "3": 0.20112499470429632, "2": 0.033990765302782555, "1": 0.013955586289689714}, "score": 4.231999566573843}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.4717834457760687, "2": 0.34244079415621376, "3": 0.11833760266103596, "4": 0.05607963190643345, "5": 0.011305469995385719}, "score": 1.7926188279712105}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4148259103067865, "3": 0.2916911622389216, "5": 0.23129044976112645, "2": 0.04639885021064274, "1": 0.015746959184519637}, "score": 3.799551354950259}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5910364431149974, "4": 0.32573585069712124, "3": 0.07432523859091501, "2": 0.006171950281538358, "1": 0.0027110995184768385}, "score": 4.496243641363842}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4209790116943843, "5": 0.31853561155513876, "3": 0.19564873421232087, "2": 0.03980239072613224, "1": 0.025006137106006555}, "score": 3.968262792290269}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.42502845472704326, "5": 0.33207487778432504, "3": 0.18408234395250833, "2": 0.038910202020687054, "1": 0.019608651638713843}, "score": 4.011349528318034}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8432802268720367, "4": 0.11989949845319434, "3": 0.03242302695921106, "2": 0.0028444515693112236, "1": 0.0014211218273633012}, "score": 4.801010403791452}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4034195466001276, "5": 0.28364137581230087, "3": 0.20253197574249499, "2": 0.06622360556942539, "1": 0.04405304953728106}, "score": 3.8164791006163648}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4815831852235382, "4": 0.3924881238203491, "3": 0.10128901640629447, "2": 0.01662326597725606, "1": 0.007811717726039586}, "score": 4.323678737759446}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6252986145924104, "4": 0.3152161137505718, "3": 0.05218387708012442, "2": 0.00490591479895333, "1": 0.002305785222556581}, "score": 4.556435461478027}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8281715997454444, "4": 0.10876080039148035, "3": 0.04201516308582267, "1": 0.013403036409108322, "2": 0.007574268499291246}, "score": 4.730853700838117}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6321890751730269, "4": 0.2061185273854786, "3": 0.11021541610361277, "1": 0.028665659664393914, "2": 0.02269319225805834}, "score": 4.390636441214562}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7973044166346038, "4": 0.15904352056015433, "3": 0.0397971888936115, "2": 0.0019886664311244075, "1": 0.0018216997229695306}, "score": 4.7480980918783215}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7956426071138837, "4": 0.1646794042020835, "3": 0.03436751129380499, "2": 0.0026603478342017285, "1": 0.0025454355605206633}, "score": 4.748396446084276}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8442539255322477, "4": 0.1381630872395478, "3": 0.015649620679834, "1": 0.001007951122592682, "2": 0.0008891235995497352}, "score": 4.823832102657047}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2805315731792486, "4": 0.22022619538152227, "1": 0.19746182588133943, "2": 0.17941489608512262, "5": 0.12211788869967104}, "score": 2.890096210471733}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5335304414396748, "4": 0.29100535788622156, "3": 0.1346177093793583, "2": 0.02235964516516103, "1": 0.0183165730101374}, "score": 4.299294684539152}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3629502523415425, "4": 0.3474742213133293, "3": 0.18831190909355475, "2": 0.054792064714131526, "1": 0.04638706176059021}, "score": 3.925886766653294}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8660091800121178, "4": 0.11333403034001448, "3": 0.017014904223332558, "1": 0.001996696927423342, "2": 0.0015629715967074725}, "score": 4.8399472996765835}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4864692918029331, "4": 0.34798900309802294, "3": 0.12535240102425657, "2": 0.022202486319525642, "1": 0.017950756860614935}, "score": 4.26286912685367}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3932371161785118, "4": 0.2708595928313414, "3": 0.15855551414743307, "1": 0.10789061383315003, "2": 0.06902299976495992}, "score": 3.77286514739714}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9280535157728398, "4": 0.05384350475595003, "3": 0.015011261393383664, "1": 0.0017601727875615884, "2": 0.0012330105481134323}, "score": 4.905384926790854}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8303223666853129, "4": 0.13049449983054104, "3": 0.03458499021001122, "1": 0.0024350280573215114, "2": 0.0020954172096860225}, "score": 4.784294553062208}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7710521872240378, "4": 0.1783220667237512, "3": 0.04074853055277687, "1": 0.0054086594930344446, "2": 0.004387867206074853}, "score": 4.7053588583400865}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.40908296299530306, "4": 0.30139158888419415, "3": 0.1552866834138747, "1": 0.07970515621370576, "2": 0.054408330644340246}, "score": 3.905852355037221}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3805154340324039, "4": 0.23506142876423466, "2": 0.163779445628583, "5": 0.11361084621591228, "1": 0.10686499180926433}, "score": 3.084787923902938}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3448615316681062, "3": 0.317708018120587, "5": 0.2573555209587562, "2": 0.05497074194111997, "1": 0.024899528784694498}, "score": 3.7549572825202993}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3462921832570151, "4": 0.3173866919794302, "3": 0.26601986301489494, "2": 0.044114621420284904, "1": 0.025942946953818137}, "score": 3.9141933260221546}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5852982456741374, "4": 0.3292801733121126, "3": 0.07266845464190713, "2": 0.0073862656241835715, "1": 0.00516385440822475}, "score": 4.482463639736602}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.42117343521558603, "5": 0.3720097929206418, "3": 0.1677726483038771, "2": 0.025763781272233076, "1": 0.013130943958393876}, "score": 4.113333682059866}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"1": 0.636184285842278, "2": 0.2393663154044735, "3": 0.08050253535181305, "4": 0.030478483601751424, "5": 0.013336615250996418}, "score": 1.5452251392617473}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.46288416027041174, "4": 0.29640862108541877, "3": 0.1745516836181167, "2": 0.03689925196840778, "1": 0.029071478666043437}, "score": 4.127343070275976}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3508971564558138, "3": 0.2738101215128639, "5": 0.23497179342984884, "2": 0.07883415002868646, "1": 0.06130166346182002}, "score": 3.6195179484969673}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.38750335583766604, "5": 0.3265845190193034, "3": 0.18793812362152226, "2": 0.05616810555477867, "1": 0.04169579477444849}, "score": 3.901211923279848}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25710585287363563, "1": 0.22727930485068365, "4": 0.20618253712522958, "2": 0.17038576616013457, "5": 0.1387754666186649}, "score": 2.8587508057469777}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"1": 0.559002742364041, "2": 0.26762784542347295, "3": 0.12172183238099603, "4": 0.03633878684620289, "5": 0.015150829440159878}, "score": 1.680798729865601}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3642180690252126, "4": 0.3061243460288627, "5": 0.14022480418822708, "2": 0.13822365739366452, "1": 0.05109502217104321}, "score": 3.346199754474565}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.30325704493048733, "3": 0.2518500017101818, "4": 0.24827241204273445, "1": 0.10038501859899276, "2": 0.09603428652265314}, "score": 3.558094486994056}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5350185980393313, "4": 0.2909955802704615, "3": 0.12541228362981366, "2": 0.029693690405565944, "1": 0.018727969076230713}, "score": 4.294079690775122}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.29293155439555124, "2": 0.2524577679245199, "1": 0.18357114049450424, "4": 0.18004630701202365, "5": 0.09091711606313899}, "score": 2.7422608726404145}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4088888337524257, "3": 0.25754969170524783, "5": 0.2280493331427357, "2": 0.076513674690506, "1": 0.028785047807732576}, "score": 3.731059751700957}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.495569600445351, "4": 0.421072479409513, "3": 0.07292593076436735, "2": 0.007245990482452288, "1": 0.0030925802628514786}, "score": 4.398911213668777}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5909117475813416, "4": 0.341884574618961, "3": 0.06136459738142384, "2": 0.004244280360389775, "1": 0.0014731681400276164}, "score": 4.5167019325060656}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7203221618735627, "4": 0.24387887277522724, "3": 0.031842140293241915, "2": 0.0025860811981383196, "1": 0.0012621041380536616}, "score": 4.6795953778226504}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4280149945579993, "5": 0.3993139218024353, "3": 0.13469630867329538, "2": 0.02684815971110126, "1": 0.01103225526678745}, "score": 4.177841309010426}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"1": 0.32201929914527494, "2": 0.2997545217851911, "3": 0.20516008544117081, "4": 0.1322174583695108, "5": 0.04080201955091947}, "score": 2.26999434766533}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6962085867086132, "4": 0.2544113840228151, "3": 0.0443530678056466, "2": 0.0032890483873846198, "1": 0.001703400043023274}, "score": 4.640189316873838}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3745473308119881, "4": 0.348345596015057, "3": 0.22084579084662237, "2": 0.036653502098614545, "1": 0.019578011592977094}, "score": 4.021661145811944}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8513453381184815, "4": 0.12732489893091536, "3": 0.018948164733124218, "2": 0.0012489995601506097, "1": 0.0011040875850385301}, "score": 4.826610479061063}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8979181336824887, "4": 0.08636805546093042, "3": 0.013491114438236307, "1": 0.001225729625057758, "2": 0.0009764116382159168}, "score": 4.878815071272715}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.31440997243162977, "2": 0.312500378064504, "1": 0.22340893446898202, "4": 0.13132431870633005, "5": 0.018172291319211328}, "score": 2.408241708676532}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4896473504205968, "3": 0.255834507147685, "5": 0.2091228919626904, "2": 0.03456418322435279, "1": 0.010775442247317827}, "score": 3.851825449415361}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.44296678020470104, "3": 0.329231443452561, "5": 0.1489372652930305, "2": 0.06145104115433232, "1": 0.017344769288064953}, "score": 3.6447450254351073}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.40552164025793014, "3": 0.3599616431550578, "5": 0.10891966356587249, "2": 0.08806007737435183, "1": 0.03739381733969533}, "score": 3.4605791910732084}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.46309722858422675, "3": 0.28542239734109737, "5": 0.18437288926644171, "2": 0.04974278753789307, "1": 0.017299753952126094}, "score": 3.7475492600044387}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3207896713653971, "4": 0.2807375027939827, "5": 0.15017225155923056, "2": 0.1331470396719694, "1": 0.11502693047394252}, "score": 3.2179086934343353}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.36667873344860535, "5": 0.32833718354956987, "3": 0.22859980057434517, "2": 0.047646085660009684, "1": 0.028528428432765724}, "score": 3.918842902167646}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6519856672777139, "4": 0.28253888269738897, "3": 0.05830051803427926, "2": 0.00442188855173476, "1": 0.0026289230587991336}, "score": 4.577026223677769}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9133908863514802, "4": 0.07805894754204293, "3": 0.007614690019724897, "2": 0.0004919384258575523, "1": 0.0003840380199466527}, "score": 4.903693974887233}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.279386933370853, "4": 0.24139801336311034, "1": 0.20430835137418302, "3": 0.18134340138352428, "2": 0.09337804739226127}, "score": 3.2982323784416083}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4426170366061111, "2": 0.20030573593509363, "3": 0.16230352267234502, "4": 0.10381205273608371, "5": 0.09082132174144385}, "score": 2.19980259512263}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.33294092737778525, "2": 0.27232270513060564, "3": 0.2659615844475586, "4": 0.09313756362246137, "5": 0.03557084988493758}, "score": 2.2260233350335272}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.36329790730901174, "4": 0.2611088000739336, "2": 0.15078418543927194, "5": 0.13063129056332623, "1": 0.09412536641635641}, "score": 3.1833460794667903}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.28904054690545855, "3": 0.240590707110707, "5": 0.23941151203124922, "1": 0.12029254836777523, "2": 0.11057376767367509}, "score": 3.4167425959250335}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.33547125645372355, "4": 0.2782093475359308, "3": 0.20139325295072988, "1": 0.09892483100762031, "2": 0.08591246928924327}, "score": 3.6654488494531505}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4132002816936813, "2": 0.2983894400055721, "3": 0.22657793712011762, "4": 0.039852812463016495, "5": 0.021895345477992132}, "score": 1.958765845561742}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.40510766811871546, "3": 0.22330817742610268, "2": 0.16946545131285387, "5": 0.11003879429015653, "4": 0.09201225539404788}, "score": 2.332363888532367}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27000400142526626, "1": 0.2105630806932986, "5": 0.19847802306937395, "2": 0.16884465296828705, "4": 0.15198345693695606}, "score": 2.958963485910205}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9222334296269254, "4": 0.047949879053599, "3": 0.02004441334931811, "1": 0.006870124847912343, "2": 0.002822839459738574}, "score": 4.876002441776415}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.35606011500932855, "5": 0.24439678657286554, "3": 0.1837306596562804, "4": 0.11504436987847586, "2": 0.10060583711377659}, "score": 2.79107798210317}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.30941966016148226, "3": 0.2834248699301965, "5": 0.2104323405694284, "2": 0.12193788539612609, "1": 0.0746294632509429}, "score": 3.4591590575179647}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.40836405939680137, "3": 0.26436665359663614, "5": 0.2193939075969269, "2": 0.07629953767617935, "1": 0.031363954227834015}, "score": 3.708274502976539}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4530316447403287, "4": 0.3851251779529417, "3": 0.1305644636310737, "2": 0.021516702176890223, "1": 0.009688186716020541}, "score": 4.250387701425072}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6418167321407401, "4": 0.2647590001970172, "3": 0.07697171979347504, "2": 0.010067089911142753, "1": 0.006271446181350815}, "score": 4.525956459211084}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3517769039197349, "3": 0.28800869739902807, "5": 0.23684082214851512, "2": 0.08210768184256093, "1": 0.04116704999525253}, "score": 3.661082110843255}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.779052501002855, "2": 0.1579924076433401, "3": 0.04053990829693251, "4": 0.013372062987941883, "5": 0.008859204534986408}, "score": 1.3146831064525224}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29491134300429384, "4": 0.22689963405514485, "2": 0.1740297182171267, "5": 0.15631704412424258, "1": 0.14770611334751055}, "score": 3.070101321493743}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33393891231288264, "4": 0.2787339601294286, "2": 0.15285454439668672, "5": 0.14328659407352118, "1": 0.0909656514785054}, "score": 3.230572104629004}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2977487705173766, "5": 0.26898334924865136, "3": 0.24503221188454213, "2": 0.10647891443078326, "1": 0.08157608793246664}, "score": 3.5661866693919504}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.27839377797481907, "4": 0.271142002737155, "5": 0.1578356937522893, "2": 0.1524861052805699, "1": 0.14002043538349754}, "score": 3.1543052370987135}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5390132261836943, "4": 0.2088607326676983, "3": 0.2034407645021579, "2": 0.034523217854683964, "1": 0.014110317663662499}, "score": 4.224206673687405}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9473642576336203, "4": 0.04706152927168548, "3": 0.005072815449633901, "2": 0.0002594208270457026, "1": 0.00022058201105605772}, "score": 4.941130989812577}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4425701924979907, "5": 0.27478549606337965, "3": 0.2363910863396786, "2": 0.03481299647485963, "1": 0.011386731556389097}, "score": 3.9346047236492883}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5917035083769085, "4": 0.325135292064129, "3": 0.07427512312082772, "2": 0.006164624824101612, "1": 0.002702154124973598}, "score": 4.497002264128712}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7705613760224225, "4": 0.19557379553766382, "3": 0.030422950644325486, "2": 0.0020303611405546947, "1": 0.0013839417649779574}, "score": 4.731946061134217}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5306402407858275, "2": 0.2753649968707842, "3": 0.12001340909313754, "4": 0.058876579439942504, "5": 0.015019438752831375}, "score": 1.752163494303231}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.32196829532789933, "3": 0.29397128102595343, "5": 0.24229201662750702, "2": 0.09249404637950362, "1": 0.04920780646905983}, "score": 3.6156836455793515}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5266476499347303, "4": 0.3452515835592986, "3": 0.1108407491686907, "2": 0.01133115463049508, "1": 0.005883292645934726}, "score": 4.375511825663991}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3906637747725618, "3": 0.2923927927523703, "5": 0.15798128536935063, "2": 0.10448220595696318, "1": 0.05441369012885899}, "score": 3.4933494442004247}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.39795177475362187, "5": 0.3365476618355506, "3": 0.19093607362892526, "2": 0.043738537522154, "1": 0.0307118102398494}, "score": 3.965995201066333}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7007195383148762, "4": 0.24192396413141323, "3": 0.04567430924932091, "2": 0.006288923296180992, "1": 0.005357166937881362}, "score": 4.626418494158405}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.33213654981520035, "3": 0.291037137406433, "5": 0.2603347437738367, "2": 0.07707113904076258, "1": 0.039369191900716485}, "score": 3.697032229101981}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.34191920928058583, "3": 0.278731730266667, "5": 0.25176126540583427, "2": 0.08228254365947786, "1": 0.04509373300001987}, "score": 3.6731141064430783}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7389337945028628, "4": 0.2173777185756337, "3": 0.03717469095197488, "2": 0.0038204681939986453, "1": 0.002621663077974505}, "score": 4.686302361580141}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6008661388223184, "4": 0.3083663360586066, "3": 0.07311486363467828, "2": 0.01127564374864232, "1": 0.006319395652500792}, "score": 4.486269820612939}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"1": 0.45498062652665383, "2": 0.3675708462489516, "3": 0.1450880905490244, "4": 0.027240506606081318, "5": 0.005012539530482493}, "score": 1.759600279170432}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7072108680917434, "4": 0.24887353577257904, "3": 0.03813033955345779, "2": 0.003381743074166084, "1": 0.0023715512549453773}, "score": 4.655223331039067}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.34611195046507787, "3": 0.27805309342037593, "4": 0.2486587510976799, "2": 0.08137867647969393, "1": 0.04572616073037796}, "score": 3.768106472161689}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8479964241528578, "4": 0.11968358623572455, "3": 0.025998724496264784, "1": 0.003239112196993521, "2": 0.003039829654007415}, "score": 4.806234826247117}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7298959786449472, "4": 0.21134295201123854, "3": 0.049357640618034236, "2": 0.005440833570399128, "1": 0.0038984509385229073}, "score": 4.658003525191358}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2841048837556348, "4": 0.21605728459514154, "1": 0.21224400482674274, "2": 0.1591323870888499, "5": 0.12832797339345012}, "score": 2.8890780302903636}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.30460290544737645, "3": 0.27160548183894767, "5": 0.2066486233073271, "2": 0.1165696652173154, "1": 0.10050159308666853}, "score": 3.400356018649934}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29226478197842853, "4": 0.27694515189504687, "5": 0.2187092405543934, "1": 0.10925491035230037, "2": 0.10268385293179029}, "score": 3.3932258219274214}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.43364020909650836, "4": 0.35668027026205207, "3": 0.14963155597856034, "1": 0.03051754240166405, "2": 0.029431736913815714}, "score": 4.133605737013896}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.25490927026982485, "4": 0.2463785265160805, "5": 0.21949375453834014, "1": 0.15832778600298397, "2": 0.12077864366058147}, "score": 3.2479595961152308}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3098877635885798, "3": 0.26380618320123866, "1": 0.25088199245173703, "4": 0.1133902352843114, "5": 0.061962073429029575}, "score": 2.4256214208125964}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.31426254872812015, "5": 0.26402153689909, "3": 0.23994220431379684, "2": 0.1001048642435446, "1": 0.08160773743499983}, "score": 3.5790206664279274}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.43846034699699454, "4": 0.3014548576185223, "3": 0.1818004721786195, "2": 0.050751312465778, "1": 0.02747563409439212}, "score": 4.072734520866477}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.76473202548986, "4": 0.18137285394339211, "3": 0.04402739610821218, "2": 0.005396805902250721, "1": 0.0043753953392409424}, "score": 4.696851397046671}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28075356143841534, "4": 0.27482591998295697, "5": 0.2178190079050412, "2": 0.13659967651047114, "1": 0.0899122395947752}, "score": 3.3940750870803384}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4529326953155013, "4": 0.41643507994687295, "3": 0.10655659782688486, "2": 0.015822403503847893, "1": 0.008187243555311228}, "score": 4.290188706422767}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8881279486960368, "4": 0.0842726334110507, "3": 0.02301900039405074, "2": 0.0026060112065524293, "1": 0.0018697216676919087}, "score": 4.854377201042378}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.30183025172936384, "3": 0.29315945587340775, "5": 0.24500930244376398, "2": 0.102681604180035, "1": 0.057165746350437835}, "score": 3.574924090741546}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.671934952512839, "4": 0.2431128354499983, "3": 0.06622885730957578, "2": 0.011014149660811112, "1": 0.007601854867156853}, "score": 4.560932447490381}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5286328835435754, "4": 0.32025923556841324, "3": 0.10523425645326387, "2": 0.025008250213869557, "1": 0.020709525820459408}, "score": 4.311302065130091}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5062277814592859, "2": 0.21612712559522032, "3": 0.1513104639956495, "4": 0.08633455115566711, "5": 0.03977535418833782}, "score": 1.9370637041413679}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7159634434206483, "4": 0.24631952592458278, "3": 0.033412747170454324, "2": 0.002704587158386882, "1": 0.0015171155673619052}, "score": 4.672645722825371}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5615834814924695, "4": 0.31120064937484015, "3": 0.09163122326912485, "2": 0.01795759740201922, "1": 0.017492396118372274}, "score": 4.381611259914518}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7260367976307501, "4": 0.23411589697973414, "3": 0.035483399911155865, "2": 0.002631143595805469, "1": 0.0016836587941364179}, "score": 4.680273537677242}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5459312646943957, "4": 0.3149523252574105, "3": 0.10815795219230412, "2": 0.01818524914608453, "1": 0.012693464808096655}, "score": 4.363351394843549}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.646236611880506, "2": 0.19278926072324618, "3": 0.11864044859677599, "4": 0.030689914385776024, "5": 0.01152565337191555}, "score": 1.5683096382052102}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.39679174806294487, "3": 0.23801137793589836, "2": 0.18362544886967522, "4": 0.11165608516852654, "5": 0.06966766399989074}, "score": 2.273602556986477}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.559489789906434, "2": 0.20965146867999315, "3": 0.16173904109724344, "4": 0.04387581595956645, "5": 0.025125985235964498}, "score": 1.7653511739275451}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.2867137923485548, "4": 0.26907309706306387, "3": 0.22892935877082637, "1": 0.1310282408509391, "2": 0.08401976585682674}, "score": 3.4965414914298814}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.38093969394215527, "3": 0.22032891080266795, "2": 0.1633306181916781, "4": 0.13040145129351788, "5": 0.10484568253724037}, "score": 2.4147928971809103}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4729994279022125, "2": 0.2744725837691518, "4": 0.16743263294345845, "1": 0.06451619509198228, "5": 0.02042466172877293}, "score": 2.8047468161112787}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.47406380814849125, "3": 0.2919681085421224, "5": 0.14316913290925523, "2": 0.07211792157821266, "1": 0.018594649517399933}, "score": 3.6511510993330862}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.44662502797594916, "2": 0.3039039139713526, "4": 0.13056540369859612, "1": 0.09807213496574403, "5": 0.020737757633217693}, "score": 2.6719613215025837}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6923582050063652, "4": 0.259720506803, "3": 0.04141020214028858, "2": 0.003990194509581603, "1": 0.002327313455588356}, "score": 4.636108810205592}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4587802232681652, "5": 0.3147667155755001, "3": 0.18551888429254232, "2": 0.029165895926878488, "1": 0.011676628489176749}, "score": 4.035889443316999}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6677347133689318, "2": 0.2140992470943735, "3": 0.08459682014626055, "4": 0.01986812281913099, "5": 0.01358772727369247}, "score": 1.4973045440059098}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3056686520984807, "5": 0.2568377798990926, "3": 0.1914584816255848, "1": 0.14433505663278068, "2": 0.10148829574565729}, "score": 3.4292766953565765}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.42143821327823544, "3": 0.20170519061901898, "4": 0.17750716583147488, "1": 0.12731266359604537, "2": 0.07190771630897183}, "score": 3.693940102111218}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6959502785949147, "4": 0.1985854287304662, "3": 0.06602381293392137, "1": 0.02528156512575172, "2": 0.014063151095005978}, "score": 4.526005840264499}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6223417872342908, "4": 0.22909788988936525, "3": 0.09809798037829107, "1": 0.029364882246810862, "2": 0.021030615962316628}, "score": 4.394114272479232}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3140282276939176, "2": 0.24100859071655642, "4": 0.21918689747230705, "1": 0.16483327013418175, "5": 0.060837804420816884}, "score": 2.770163194299311}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.46741888188186914, "3": 0.2841215327896348, "5": 0.1840071800727471, "2": 0.04751309128090905, "1": 0.016841021716621937}, "score": 3.754312250367701}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5825362288649679, "4": 0.3263091937569461, "3": 0.07940574962005091, "2": 0.007409617947834842, "1": 0.004254198080227695}, "score": 4.475589079758991}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5128900419312986, "4": 0.4027171598655262, "3": 0.07265507761080107, "2": 0.008148924692538372, "1": 0.0035205065270309567}, "score": 4.413403826442352}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4452297668804382, "5": 0.2992445640366818, "3": 0.18502184126140298, "2": 0.04507227349088023, "1": 0.025298931938736363}, "score": 3.9481745067564358}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3123151515061888, "3": 0.3106759411261207, "5": 0.2759548537539006, "2": 0.07002869446491858, "1": 0.030938667561615205}, "score": 3.732382320811711}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4454412567110152, "4": 0.3513093867596532, "3": 0.16041316674175463, "2": 0.027299625358971034, "1": 0.015452774692739167}, "score": 4.184085939685364}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3780196880237484, "4": 0.3401237693887281, "3": 0.22218433584691616, "2": 0.038189372839220276, "1": 0.021390816170011276}, "score": 4.015285564531329}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7910063764463571, "4": 0.18683735498990553, "3": 0.02076820224933158, "2": 0.0008281854957385027, "1": 0.0005106030907512627}, "score": 4.767087794276909}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.42182818179483744, "5": 0.35799613096506155, "3": 0.1661429693755162, "2": 0.03266604564590585, "1": 0.021246351340025185}, "score": 4.062789571174032}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"4": 0.34495258713125887, "3": 0.23147493117046208, "5": 0.16221007898333092, "2": 0.13811722470818572, "1": 0.12315721118740132}, "score": 3.2849661655821443}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.498917144551623, "4": 0.3614442022207257, "3": 0.11980474337133667, "2": 0.01297813838233762, "1": 0.006792508264193696}, "score": 4.332799653597331}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4652883956239093, "3": 0.3080552281215802, "5": 0.16353451663633636, "2": 0.04952843648055842, "1": 0.013547919308712832}, "score": 3.715765723879632}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.693538448169857, "4": 0.2603514057306152, "3": 0.041460388563883725, "2": 0.0032687497716812246, "1": 0.0013228047314744202}, "score": 4.641609489486149}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3194970942132868, "3": 0.2687091529809076, "2": 0.16539541788679796, "1": 0.13369372893175957, "5": 0.11262929819593129}, "score": 3.1119812479152817}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9731348455387194, "2": 0.024036739659441836, "3": 0.0024019268730022473, "4": 0.00021467785549826514, "5": 0.00019652694723524923}, "score": 1.0302711973994092}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3039974395938607, "3": 0.29037639028734114, "5": 0.2103861767782605, "1": 0.1009985114871974, "2": 0.09406718669041696}, "score": 3.428780317820923}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3801301442605827, "4": 0.2484197060860478, "3": 0.2276082112118551, "1": 0.08301851697362458, "2": 0.06064376814404658}, "score": 3.782139706513902}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.38862615445239074, "4": 0.3042279265853414, "3": 0.1870187125540453, "1": 0.06760114217473459, "2": 0.05226551993467374}, "score": 3.894245421752358}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3241716563295041, "3": 0.2533493278785978, "2": 0.1874419652779527, "4": 0.1516703899317604, "5": 0.08320765734444557}, "score": 2.48221809768478}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4651999806186648, "4": 0.39257840647093456, "3": 0.11659372767937694, "2": 0.017341184494754268, "1": 0.008229199789037868}, "score": 4.289252916899376}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8573363702643518, "4": 0.12557596559333994, "3": 0.016340558666801803, "2": 0.0005188121429269111, "1": 0.000197015135939012}, "score": 4.839393396615597}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9161508174406561, "4": 0.0663809341517557, "3": 0.015519536955711715, "2": 0.0009555816932804151, "1": 0.0009551262760445505}, "score": 4.895888785164066}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9419715222687048, "4": 0.05282457821941573, "3": 0.0046670257246423765, "1": 0.000251274397205434, "2": 0.0002267516935950518}, "score": 4.936152260369293}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7132955559395304, "4": 0.21947081863941242, "3": 0.056655897090848305, "2": 0.006136378080779418, "1": 0.004338448427388799}, "score": 4.631416531316496}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"2": 0.35325687339960105, "1": 0.3424137766434098, "3": 0.22773855421989989, "4": 0.054514094285707894, "5": 0.02196242369074376}, "score": 2.060247122126339}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.38252024462192236, "5": 0.28400421482442006, "3": 0.1974965624715055, "2": 0.08199705065390825, "1": 0.053908182698576786}, "score": 3.760771361098063}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4786892689030868, "4": 0.34036728310146724, "3": 0.12725342606804976, "2": 0.03214814269344744, "1": 0.021478808093724978}, "score": 4.222717180193468}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6363167531999638, "4": 0.299088997314236, "3": 0.05392072320027628, "2": 0.00664991637221643, "1": 0.003979914270472772}, "score": 4.557180800817103}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7278260511968406, "4": 0.20202904596743584, "3": 0.05271891338809554, "2": 0.009001029673710317, "1": 0.00836332670348675}, "score": 4.632054053782878}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3051050913253575, "3": 0.2186635132331515, "4": 0.17952631143235778, "2": 0.17714024774830125, "5": 0.11945056203869481}, "score": 2.631034841904294}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.29078401612955646, "3": 0.23553887613976096, "4": 0.16709471026265788, "2": 0.15666826043633567, "5": 0.14962027418456858}, "score": 2.7280190408373244}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29793393848150473, "4": 0.19672033070119455, "1": 0.1884756609611909, "2": 0.17511827083294687, "5": 0.14161452858279552}, "score": 2.927869893780012}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6715168971797454, "4": 0.22867483934208188, "3": 0.07108908287672248, "1": 0.015576067146913758, "2": 0.013004440537994289}, "score": 4.5277639183480956}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8169712618132321, "4": 0.1354487823710654, "3": 0.03776019777625259, "2": 0.004892171522187942, "1": 0.00486348850102061}, "score": 4.754884642097592}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27561202740306484, "4": 0.25366220465560896, "5": 0.17260094936005382, "2": 0.15182931753905105, "1": 0.146068527639264}, "score": 3.1549328962048193}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.45039926681995485, "2": 0.2572983171848821, "3": 0.19511973172471547, "4": 0.06213343681019552, "5": 0.034924503154865075}, "score": 1.973757574396593}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.32492814935553155, "3": 0.2840237265841998, "5": 0.28203229311729017, "2": 0.0687472460975953, "1": 0.040156707159524706}, "score": 3.7400148663242123}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6589497692965312, "4": 0.2869649201889273, "3": 0.04693641807764422, "2": 0.004494980271751491, "1": 0.002609988144486993}, "score": 4.595219570678642}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.37743130513669787, "5": 0.3279555493683936, "3": 0.19593020110254972, "2": 0.05696687046691626, "1": 0.04164114241887195}, "score": 3.8931601744063022}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5114983599241475, "2": 0.28954530507467197, "3": 0.13943317845116465, "4": 0.04641573318317585, "5": 0.01301651295850279}, "score": 1.7597939865421086}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3678156931882096, "2": 0.23438769931062814, "4": 0.22514676512084944, "1": 0.12141564951190031, "5": 0.051130453519498756}, "score": 2.8501731308835665}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3504672201468087, "2": 0.2664576925863166, "1": 0.1727354060632436, "4": 0.16811271532408642, "5": 0.042066633751327374}, "score": 2.6402598002020983}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3385751846726361, "3": 0.3299545702194868, "5": 0.1373426198939328, "2": 0.13345385717865452, "1": 0.06050713421429654}, "score": 3.35885209574914}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.288172361624442, "1": 0.22827245166163534, "2": 0.20898291014537487, "4": 0.19441304214168112, "5": 0.07995850231124739}, "score": 2.688739753367716}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3551763330538345, "3": 0.29990650586939577, "5": 0.20899741406261904, "2": 0.0911668987579873, "1": 0.04465404420774498}, "score": 3.5927547405736835}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7879736884292009, "4": 0.17166824033989725, "3": 0.03321865045816884, "1": 0.0035764843006866926, "2": 0.0034650923307991723}, "score": 4.737167527931099}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.35260712577187847, "5": 0.28651668705597966, "3": 0.2614956318037616, "2": 0.06560130433987242, "1": 0.03371909786207884}, "score": 3.792648680147784}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7471517638698683, "4": 0.19276556837902764, "3": 0.04966139044494449, "2": 0.006050522179516822, "1": 0.004276589640414081}, "score": 4.672622898006887}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8419092076063189, "4": 0.14272973528468932, "3": 0.013848698803057799, "2": 0.0008548237932782172, "1": 0.000625055382596061}, "score": 4.824502474192011}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"1": 0.31772619153897835, "2": 0.26900551438982073, "3": 0.23485283383676708, "4": 0.13169803376435094, "5": 0.046570825320287355}, "score": 2.320282139517265}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4234182151789413, "4": 0.3224632186333157, "3": 0.16946397696984086, "2": 0.04788546333791125, "1": 0.03658817786157955}, "score": 4.048427540816086}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3580267051401446, "4": 0.3008568526334933, "2": 0.13660653398635317, "5": 0.12370098955246103, "1": 0.08073347352941172}, "score": 3.2502042273907406}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6299824355906846, "4": 0.2803956885527521, "3": 0.06991938803730727, "2": 0.010435018140772544, "1": 0.009177674765063855}, "score": 4.511705935566822}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4366325867986643, "5": 0.2402385478273576, "3": 0.22672562341491453, "2": 0.05783204182898358, "1": 0.038415701873913265}, "score": 3.7825679248242117}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"3": 0.33999549889625047, "4": 0.2520639383605853, "2": 0.1637975933965264, "5": 0.1514357252242915, "1": 0.09264286865660033}, "score": 3.2058653107747035}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8902048359359565, "4": 0.10095403144033688, "3": 0.008016270421432518, "2": 0.00044560600198331583, "1": 0.0003115019374540281}, "score": 4.880422500075674}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5424880996159074, "4": 0.3066522529382718, "3": 0.12937553237436925, "2": 0.015567757974568504, "1": 0.005863374428998924}, "score": 4.364406235219939}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8251172760189157, "4": 0.15293207659277713, "3": 0.019732070948716804, "2": 0.0014170948263664547, "1": 0.0007646344358377523}, "score": 4.800286600412277}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6531396783844794, "4": 0.29537008011992155, "3": 0.046318042822979695, "2": 0.0034985957684742284, "1": 0.0016018260808395664}, "score": 4.59506167741891}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6948227165899851, "4": 0.23417068650975242, "3": 0.05500567044852051, "1": 0.008005059497651451, "2": 0.007934951795051298}, "score": 4.599968511235688}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.41633931089234855, "4": 0.33533786606146954, "3": 0.17762776965092836, "2": 0.037998963345858956, "1": 0.03259380628231978}, "score": 4.064938837891711}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.35068657610480947, "3": 0.32495498952915225, "5": 0.1849910376893015, "2": 0.09002338581645566, "1": 0.04918284476137821}, "score": 3.532365375394944}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6102605206231445, "4": 0.2827876263453155, "3": 0.07855230267048423, "2": 0.014678433078713235, "1": 0.013585435217441773}, "score": 4.461657684810861}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6223578065180615, "4": 0.2759095180958551, "3": 0.07493445356736811, "2": 0.01391541166750895, "1": 0.012784484394402641}, "score": 4.481286399281918}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"2": 0.33673187111116837, "1": 0.30706077095228784, "3": 0.2553301411528865, "4": 0.08599647258700505, "5": 0.014831465615019877}, "score": 2.164764831596872}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8454070006591086, "4": 0.1363058528857777, "3": 0.01604075352146083, "1": 0.0012256291193492937, "2": 0.0009852097453686658}, "score": 4.8237482278901425}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7990767581962346, "4": 0.1518745390429619, "3": 0.04265563038675729, "2": 0.0036105144856187626, "1": 0.0027564848942409396}, "score": 4.740949962939592}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8499064367229494, "4": 0.12338940872538307, "3": 0.022416598277293674, "1": 0.0023299068284354627, "2": 0.001924969799378506}, "score": 4.816676867072962}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.43278690862550023, "5": 0.3556973678396017, "3": 0.15136281133809654, "2": 0.032767736204410855, "1": 0.027335367566243746}, "score": 4.056795810303876}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"1": 0.31884301924493785, "3": 0.2448788942088954, "2": 0.21771424038418596, "4": 0.15094437311595904, "5": 0.06725203504942834}, "score": 2.4298386654022344}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.48785949239868515, "4": 0.30549795327004, "3": 0.13145143646797988, "1": 0.040213721932358275, "2": 0.034729465586726065}, "score": 4.166349201975083}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.407508046697193, "4": 0.23880568290194823, "3": 0.19823154744492777, "1": 0.08074251618482624, "2": 0.0744656822994341}, "score": 3.81807273657642}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5745986395998807, "4": 0.2909159165870394, "3": 0.0946288766030269, "2": 0.02016756617276461, "1": 0.019535483506514618}, "score": 4.38108668361846}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4530549764708197, "4": 0.3371239540788087, "3": 0.13580492472114827, "1": 0.03935081471550577, "2": 0.0342148677448308}, "score": 4.130826804652748}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4192472238525862, "5": 0.3904915300306442, "3": 0.13908912003085697, "2": 0.029475322238929198, "1": 0.02160215069577205}, "score": 4.127657396609477}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9015079479644327, "4": 0.09380902614883653, "3": 0.004316404564486189, "1": 0.00017936010737217858, "2": 0.00015056585420688325}, "score": 4.896385224548526}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.718776225416666, "4": 0.182193913556936, "3": 0.07758948993093509, "1": 0.010836443794859337, "2": 0.010529978443387806}, "score": 4.587660904066664}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9660865331029855, "4": 0.031439871455343146, "3": 0.002131603000317886, "1": 0.00013317267014522458, "2": 0.0001152582840167941}, "score": 4.963415034067569}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9603922108370779, "4": 0.03574280102678131, "3": 0.0030520920666775087, "1": 0.00048580463523238807, "2": 0.00025552533365176555}, "score": 4.955440031314778}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28667801269996623, "4": 0.27955629316331, "2": 0.16345672542131842, "5": 0.14650796256829762, "1": 0.12366916538220427}, "score": 3.161798493751355}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5818192770528094, "4": 0.29297757755777154, "3": 0.09195995209686735, "1": 0.01692931405832829, "2": 0.01623468136571953}, "score": 4.406634224613368}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.42177929474162684, "5": 0.2557137561823687, "3": 0.23250652263596627, "2": 0.05838479982471173, "1": 0.031526528909133184}, "score": 3.811841282659464}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7076766490455589, "4": 0.2399112057835477, "3": 0.042879698221037967, "2": 0.0055649938465304125, "1": 0.003937780654646332}, "score": 4.641872667101294}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2576360110689399, "4": 0.2568720443443188, "5": 0.17715863586034405, "1": 0.16126848406746588, "2": 0.14691730522257992}, "score": 3.1417559544659976}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.32557624667085594, "2": 0.32285776783528036, "3": 0.25884770546908936, "4": 0.07206158343949433, "5": 0.02052521394640086}, "score": 2.138988542096714}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7973208731675939, "4": 0.18108194778199133, "3": 0.01898199463329273, "2": 0.0013727503456657587, "1": 0.0012044045301865234}, "score": 4.772009523420441}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8842839478019109, "4": 0.08946337100375229, "3": 0.02363577086187817, "2": 0.001508919118555081, "1": 0.0010556661389324272}, "score": 4.854508052484034}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7111674951920982, "4": 0.21907538163779422, "3": 0.05562077480180337, "2": 0.008081845734889848, "1": 0.005945069847260494}, "score": 4.621615844532517}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6827932185063089, "4": 0.2505386948318281, "3": 0.05622310418887668, "2": 0.006641981110362065, "1": 0.003719096561515358}, "score": 4.602179388153957}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6892346154763697, "4": 0.2058611637059325, "3": 0.06906936427444396, "1": 0.019888372788417496, "2": 0.01578096834675667}, "score": 4.529025758057387}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.42865239352714507, "3": 0.1991249025785008, "4": 0.1963902947531357, "1": 0.10220963803835309, "2": 0.07354263300777132}, "score": 3.7757953434839586}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.45806862493025424, "4": 0.26122277282133055, "3": 0.18527178942415484, "2": 0.049014196418820224, "1": 0.04634918364326143}, "score": 4.035723515015058}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4843106206086337, "4": 0.27022560359681713, "3": 0.15522486056628515, "2": 0.045722845703896176, "1": 0.04439156522504048}, "score": 4.104478380967052}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6263961879325921, "2": 0.1847682762175884, "3": 0.08634235615187213, "4": 0.0636495642522372, "5": 0.03871705803350778}, "score": 1.703358928697941}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2829673384038236, "2": 0.23989443657635406, "1": 0.20559022300694405, "4": 0.19803082075948217, "5": 0.07338757027530428}, "score": 2.693691377759722}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5665970885819496, "4": 0.3273506691351941, "3": 0.09192756950464806, "2": 0.008800545242872958, "1": 0.005271961945691683}, "score": 4.441275562154375}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8430652852742225, "4": 0.1391915551427618, "3": 0.016345893095682087, "2": 0.0008557360347480209, "1": 0.0005215348809239443}, "score": 4.823459781015335}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9455432414302374, "4": 0.05090314344822759, "3": 0.0031915177233045513, "1": 0.00015951046924400476, "2": 0.00015159728407333834}, "score": 4.941618010499053}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9093042830406575, "4": 0.08342361969012563, "3": 0.006221677587466333, "1": 0.0005012603155020696, "2": 0.00046307756079121766}, "score": 4.900730205867453}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"1": 0.40525068015853477, "2": 0.280848163248044, "3": 0.19787894977895285, "4": 0.08922165498229101, "5": 0.026573779033139913}, "score": 2.050804437748972}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8252630788709892, "4": 0.1581722420767067, "3": 0.014781335632314836, "2": 0.0008592929998657445, "1": 0.0008471238093734237}, "score": 4.806283810491665}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.45108212532167685, "5": 0.24552009051603624, "3": 0.23693226035230247, "2": 0.039316979699214334, "1": 0.026988452220572005}, "score": 3.848964334518415}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.45935506769872636, "4": 0.39155012442881104, "3": 0.10637607355134189, "1": 0.023234747121980225, "2": 0.019267462241750882}, "score": 4.244792832055471}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6176508554454189, "4": 0.31250437809494336, "3": 0.058096648605383494, "1": 0.006279694162040193, "2": 0.00537679019976137}, "score": 4.530010110631864}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.41857372487160854, "2": 0.3450772410183581, "3": 0.1735438628033485, "4": 0.05326431415995974, "5": 0.009456764248900976}, "score": 1.8898597969895243}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4322463753476966, "5": 0.3959961856385225, "3": 0.15003510183937196, "2": 0.013906679704418577, "1": 0.007716722127459895}, "score": 4.195016852066991}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.36687136369968865, "3": 0.30331109015118013, "5": 0.13552420770090398, "2": 0.10592711666423128, "1": 0.08830072153511521}, "score": 3.355414499105182}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4697390928550808, "5": 0.3509524271104054, "3": 0.14972470067481214, "2": 0.01964058088232631, "1": 0.009890944869939513}, "score": 4.132280642201871}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5752265590784584, "4": 0.3159638091374837, "3": 0.09119024959070574, "2": 0.010806098805763916, "1": 0.006721841024423656}, "score": 4.442299033671818}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4486943491078732, "2": 0.31038031836892804, "3": 0.16099615439955373, "4": 0.06276611633013884, "5": 0.017005184684196126}, "score": 1.8888320411285522}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3324411922308161, "3": 0.2856392294303621, "2": 0.14507583112334105, "5": 0.14095763425917238, "1": 0.09561495864338522}, "score": 3.2781261274380404}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3385498601959697, "4": 0.32476773944384657, "5": 0.2036391752490812, "2": 0.09337143646053564, "1": 0.039372731350164225}, "score": 3.5600966917857555}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6666015885820175, "4": 0.22725010133637633, "3": 0.07988892872128388, "2": 0.014039422692467399, "1": 0.012026321175031293}, "score": 4.522656056759144}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3498328534986099, "2": 0.24231011651717158, "3": 0.23636993028419878, "4": 0.13612941021230188, "5": 0.03527217745128589}, "score": 2.2646350590468605}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"4": 0.35563164103936823, "5": 0.2659684197481121, "3": 0.23469750658981972, "2": 0.07617595631535982, "1": 0.06745868112595124}, "score": 3.676521026834058}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.28328166319232473, "4": 0.26058533235713, "3": 0.2269352600942624, "1": 0.11686886321537128, "2": 0.11221455170081007}, "score": 3.4812514018135445}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7443002453334318, "4": 0.20615911611935048, "3": 0.044362702338246365, "2": 0.003218831092767735, "1": 0.0019301819613832783}, "score": 4.687729226224384}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9003900235778535, "4": 0.08602580238460351, "3": 0.011364872959076322, "1": 0.001290338102484774, "2": 0.0008877205148864009}, "score": 4.88341512949566}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.33115891933115416, "3": 0.2400821794201263, "5": 0.15881815666876106, "2": 0.13542449858149305, "1": 0.13443958002693215}, "score": 3.244510319654525}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.288011836710939, "3": 0.23915990313290933, "5": 0.16848709831242056, "2": 0.15596842438629183, "1": 0.14797469493584586}, "score": 3.1731371350196014}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3966178723474155, "5": 0.2710493151322681, "3": 0.21544746091953815, "2": 0.06545446296684224, "1": 0.05134846171094038}, "score": 3.77062863677053}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3568299647071523, "3": 0.3234344865754257, "5": 0.16415171291985617, "2": 0.10167596868154062, "1": 0.05379718158944099}, "score": 3.475915735670254}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5670852124717389, "4": 0.29798313143551464, "3": 0.09877250524018513, "2": 0.019363179117502398, "1": 0.01670019805581686}, "score": 4.379522103057262}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.30097884472767766, "4": 0.3004609150066111, "3": 0.22473285349453329, "2": 0.09283501440081719, "1": 0.0808789084727167}, "score": 3.6478992862940194}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3006855032980406, "3": 0.2048890020289369, "4": 0.18652901044710926, "2": 0.16569899827189996, "5": 0.1416436616875621}, "score": 2.702581611433375}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5763635812340169, "4": 0.2053978805885039, "1": 0.09597818048139134, "3": 0.088501073243198, "2": 0.03355177536415896}, "score": 4.132851983812424}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.28039052931954783, "1": 0.22341170475694516, "4": 0.17445877703568521, "2": 0.16652720325404416, "5": 0.15486792841915847}, "score": 2.870799594614544}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4434592784722253, "4": 0.28708716457853073, "3": 0.13688216948281792, "1": 0.08322013110716665, "2": 0.04918194472355443}, "score": 3.9585458075436675}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3539175155215439, "3": 0.18002877135572098, "4": 0.16629183367036982, "2": 0.1539694458229828, "5": 0.14535359774441906}, "score": 2.595016831145838}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4693524219457134, "2": 0.3208559854437923, "3": 0.1468997055836537, "4": 0.048562181958151984, "5": 0.014139188649062353}, "score": 1.817054359352989}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4535510258955132, "4": 0.3477894190631002, "3": 0.14952161719236937, "2": 0.030257460403594377, "1": 0.018775570418172138}, "score": 4.187207416014932}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3057315957537748, "4": 0.2983646448733596, "5": 0.18831013896992888, "2": 0.1227882072557222, "1": 0.08458874999457093}, "score": 3.383102219703059}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6739950785170336, "4": 0.2654503132185644, "3": 0.05076403233841541, "2": 0.0055674596849473075, "1": 0.0041446663011199345}, "score": 4.599709175054115}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5455176055923632, "4": 0.3402016326306493, "3": 0.09093572870173566, "2": 0.012843547934539321, "1": 0.010412196703798353}, "score": 4.397693700359029}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"5": 0.40046175907152104, "4": 0.26282012924614145, "3": 0.21626583725294363, "2": 0.06099022338688247, "1": 0.05933369036432512}, "score": 3.8841995397262217}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.39047286498160694, "4": 0.3508397543766358, "3": 0.19603299344796407, "2": 0.0425443167191987, "1": 0.019938068195685468}, "score": 4.049545555456638}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4010798677745393, "4": 0.2564542481670978, "3": 0.23499876974014516, "2": 0.07004305181886238, "1": 0.03730858566996539}, "score": 3.914059313228749}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.602361569609758, "4": 0.31903374439158155, "3": 0.06729868378177804, "2": 0.007171929164221717, "1": 0.004092775224636591}, "score": 4.5084617001894784}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8850866350973716, "4": 0.09936420905793569, "3": 0.013435305473921515, "2": 0.0011629101099072962, "1": 0.0009158060055991547}, "score": 4.866608539032463}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3325917889468296, "1": 0.30687809344857647, "3": 0.24656843432334868, "4": 0.07638464383013695, "5": 0.03742110982391394}, "score": 2.204754885359728}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.41342316416798774, "3": 0.28645890246797207, "5": 0.21071452998781404, "2": 0.06827251562871858, "1": 0.02100915886310898}, "score": 3.724649601576259}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.30927924644703814, "3": 0.30614399984275836, "5": 0.21947042359229443, "2": 0.11192447113940741, "1": 0.05301579982236424}, "score": 3.5303520926684557}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6463984110054756, "4": 0.2646900129909892, "3": 0.07124960526422157, "2": 0.011330317289108029, "1": 0.0056940244280315}, "score": 4.535747706164958}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.35284877968284006, "1": 0.27576919861728505, "3": 0.2308008641971808, "4": 0.10897230626475933, "5": 0.031496463792745455}, "score": 2.2674957326496425}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3640286156544671, "3": 0.3476654194667043, "5": 0.16526024585898855, "2": 0.08991351635764244, "1": 0.03302734249922211}, "score": 3.538637387620608}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.33497509272359355, "3": 0.31036790340449427, "5": 0.21589657616865948, "2": 0.09444659844777348, "1": 0.044245296808084165}, "score": 3.583871067110162}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3046539611726797, "3": 0.300737285800054, "5": 0.1780538938640271, "2": 0.11507410118477178, "1": 0.10138531710861688}, "score": 3.342949744920699}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4158678406252398, "3": 0.26991394311295247, "5": 0.2277524922459174, "2": 0.056143604755563126, "1": 0.03024886850494712}, "score": 3.754786772052821}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4645792600897841, "3": 0.2514985134991423, "5": 0.2091875209209667, "2": 0.053034533613570835, "1": 0.021584543481531528}, "score": 3.786841662593652}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8547435897945522, "4": 0.11335153046527388, "3": 0.027462742804489404, "1": 0.0022357512000122696, "2": 0.0021524972483800498}, "score": 4.8163125887438305}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3812010701069387, "3": 0.2898459801551504, "5": 0.24825436329445894, "2": 0.05347720984729044, "1": 0.027149202686857096}, "score": 3.7699897546455694}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6288171902858296, "4": 0.28246356787117427, "3": 0.07589653862759324, "2": 0.007020763543350904, "1": 0.005748001786279561}, "score": 4.521663256625844}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6857912210983745, "4": 0.24049304710994174, "3": 0.06407972293290688, "2": 0.005041284339986228, "1": 0.00454473663102901}, "score": 4.59802461357967}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3934035300047294, "4": 0.3201332703641208, "3": 0.1841658994775087, "2": 0.052020734473569065, "1": 0.050198948435693544}, "score": 3.954595792123503}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5457145184270051, "5": 0.13170145795774307, "2": 0.12584814465756855, "3": 0.10416693734137154, "4": 0.09217878246600426}, "score": 2.1379681872703187}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7964693509766115, "4": 0.16133335929729198, "3": 0.03440584555894464, "1": 0.00408721283361433, "2": 0.003568617546731382}, "score": 4.74276536104668}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.3224192376498653, "2": 0.24254624154488064, "3": 0.20768528458169846, "4": 0.1470915348408065, "5": 0.08018472849576279}, "score": 2.420033953190931}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9494323075540461, "4": 0.04475432906757316, "3": 0.005160748767683106, "1": 0.00032121945756572736, "2": 0.00027483160316200825}, "score": 4.942811565976466}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6458961026148008, "4": 0.23020998691286848, "3": 0.08673294317054198, "1": 0.020356948006196265, "2": 0.01673335911862609}, "score": 4.464658430035314}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3926775450342854, "1": 0.19849852690816208, "3": 0.16970869000660155, "4": 0.16440983081551402, "2": 0.0744751474891544}, "score": 3.4784028765035715}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3351704066238481, "3": 0.26016165270356884, "5": 0.19467561858451113, "2": 0.1075726334037301, "1": 0.10204333530420613}, "score": 3.4130177804184445}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4771686913426082, "4": 0.26674490213618646, "3": 0.17004824297237223, "1": 0.048915258324355435, "2": 0.03704895991884257}, "score": 4.086283133792184}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4969052574155848, "4": 0.2979412081582934, "3": 0.13372417445992918, "1": 0.03755961781550077, "2": 0.03372934665314405}, "score": 4.1830692382996615}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2713421251228445, "3": 0.263978821670175, "1": 0.16908086286538399, "2": 0.15592778431052862, "5": 0.13955885040206176}, "score": 3.0563766050133045}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.745597663003042, "2": 0.17872513714096772, "3": 0.06049385435585432, "4": 0.01008733098924784, "5": 0.005005329671262819}, "score": 1.3500278997294226}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5717288491170387, "4": 0.34305547849915385, "3": 0.06775848413348985, "1": 0.009645801847492148, "2": 0.007668785655974762}, "score": 4.4597609503840205}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6044383495404984, "4": 0.2695204527626728, "3": 0.08597501054602145, "1": 0.025350546271640115, "2": 0.014638898680799341}, "score": 4.413165610055164}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7268514537812643, "4": 0.17130700179969197, "3": 0.06264426137498955, "1": 0.026178644395437954, "2": 0.012907961337918484}, "score": 4.559917306685841}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.32591163260147743, "4": 0.19469240034611662, "3": 0.18818764542009966, "5": 0.15653554033370326, "2": 0.13433346843291336}, "score": 2.721512252902128}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"3": 0.33627930481413254, "4": 0.32337627360716636, "5": 0.17910110503526985, "2": 0.11281167990742841, "1": 0.048157451343033106}, "score": 3.4725814759746534}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4101397597214025, "4": 0.34215165655184926, "3": 0.1707390178038971, "2": 0.04579916589167497, "1": 0.03101658554460371}, "score": 4.054761076547218}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.30167602570352314, "3": 0.2977760753315396, "4": 0.284119316650322, "2": 0.07951544495718657, "1": 0.0367636902089546}, "score": 3.7345383173392435}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.827942956571252, "4": 0.14085978725435463, "3": 0.02568640282619811, "1": 0.002858597097062471, "2": 0.002504590577297618}, "score": 4.7887880582194}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7113577721707259, "4": 0.19854510012539953, "3": 0.06695956160098457, "2": 0.012234309746312108, "1": 0.01074189566881952}, "score": 4.587798751681494}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.29419187160600513, "2": 0.2456846195275124, "3": 0.2415183802717312, "4": 0.15136104040356388, "5": 0.06666904678263347}, "score": 2.4503146794082937}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6559563709158599, "4": 0.25769867576655026, "3": 0.06705849371144554, "2": 0.011558035148931799, "1": 0.0076098151333414904}, "score": 4.543016768358272}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.32684981334366614, "4": 0.24664483305785498, "5": 0.18763141482613208, "2": 0.14701677251068807, "1": 0.09172757831048543}, "score": 3.2914735050327986}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5979209227377404, "4": 0.30446047597822634, "3": 0.07944977642796787, "2": 0.011024072369609783, "1": 0.006945609817049559}, "score": 4.475680900483711}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.361292572047709, "4": 0.35598036647573567, "3": 0.17607623928195423, "2": 0.06268964478042492, "1": 0.04370837271166528}, "score": 3.928693898552145}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7487395621626721, "2": 0.19346023335695856, "3": 0.04471915257007968, "4": 0.010333652257627524, "5": 0.002679285833523576}, "score": 1.324638750989265}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5647140963886379, "4": 0.30677858901838656, "3": 0.10129344283302814, "2": 0.014667736400411819, "1": 0.012307730722642676}, "score": 4.397256696425323}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5899853930094195, "4": 0.29547965320170994, "3": 0.09170588730327772, "2": 0.012862534443531195, "1": 0.00982532345637769}, "score": 4.443141041769713}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.951318181200277, "4": 0.04343810185927599, "3": 0.0042762595004374095, "1": 0.0005135993865506315, "2": 0.00036204664530710754}, "score": 4.944863779523683}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.61504238183328, "4": 0.2979851577276978, "3": 0.0646769112333463, "1": 0.011465077534299742, "2": 0.010706641811936368}, "score": 4.4946182028757}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"1": 0.45472708189780386, "2": 0.23290265556232942, "3": 0.1757920704967569, "4": 0.08882376863422616, "5": 0.047472166884960566}, "score": 2.0411406387359685}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26807277146852737, "4": 0.25689105357893327, "2": 0.16295511242437882, "5": 0.16222107719952128, "1": 0.1495157710114307}, "score": 3.1193876484686363}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3199201005968041, "4": 0.28332056043491566, "5": 0.17838495417088338, "2": 0.1256553672534424, "1": 0.09249389838914779}, "score": 3.329521486343441}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5281330174581936, "4": 0.2315256528842424, "3": 0.14306987953566788, "1": 0.05219946673240691, "2": 0.04477914326879584}, "score": 4.138947140485103}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3098962546296288, "5": 0.28624605667970454, "3": 0.21684314953496833, "1": 0.09640026773841921, "2": 0.0903161126332492}, "score": 3.599450451296595}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4104086944676333, "2": 0.2088129507985182, "3": 0.17159129871550655, "4": 0.1214024523480772, "5": 0.08744991058395335}, "score": 2.266426411773919}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5673310404699033, "4": 0.3161511680112239, "3": 0.09018766616593636, "2": 0.015096610961309237, "1": 0.0111138300029388}, "score": 4.41365817079783}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.3595493633934267, "3": 0.231121507560036, "2": 0.2132613222997194, "4": 0.11010380239706867, "5": 0.08581568331268469}, "score": 2.3492786042636093}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7153771162632776, "4": 0.21259135013556335, "3": 0.05465997258704475, "1": 0.008966360738566334, "2": 0.008294410705476414}, "score": 4.617297630188635}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.32881993107914, "3": 0.26714165986169586, "5": 0.1600069543508596, "2": 0.13350376490552174, "1": 0.11037135989892867}, "score": 3.2946334150909338}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"1": 0.37334056239146896, "3": 0.18463798663408318, "4": 0.18409081193509225, "2": 0.15819574821834237, "5": 0.09938079432842978}, "score": 2.4777906150790767}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3820435506258113, "5": 0.28037188396931284, "3": 0.24678304220210084, "2": 0.049092500262148495, "1": 0.04154435613497879}, "score": 3.810739607933782}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.35822173958682335, "4": 0.2227696947842249, "2": 0.20103042785842373, "1": 0.11405729147828148, "5": 0.10360324782354774}, "score": 3.000831443681574}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5568375351319077, "4": 0.2848553703435489, "3": 0.11203608187176091, "1": 0.023876389389117014, "2": 0.022222030884608616}, "score": 4.328784969103594}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.39509697811480565, "5": 0.37946494042914286, "3": 0.17038247774658097, "2": 0.028122075671159423, "1": 0.02672613909912344}, "score": 4.072674966026982}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.339734312728988, "4": 0.28357237425994497, "2": 0.1608753882024364, "5": 0.11918337566199791, "1": 0.09656091753610198}, "score": 3.1679542690526263}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.40437884713164457, "4": 0.25145259406314946, "2": 0.1667270724819525, "5": 0.098570968287909, "1": 0.07871964782625407}, "score": 3.124446937840039}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.39378769503587563, "4": 0.27327386995616804, "2": 0.17534317943778244, "5": 0.09266904396408392, "1": 0.06483102560543734}, "score": 3.153621349837584}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6006881886277242, "4": 0.26058921510750854, "3": 0.101770632378182, "2": 0.01893197097609503, "1": 0.01795745374181464}, "score": 4.407206719441622}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.334414311881076, "2": 0.22775429149771315, "4": 0.22393863848254922, "1": 0.14049530600268445, "5": 0.07332794509314111}, "score": 2.8618400220742455}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6487802353752444, "2": 0.19237622866901627, "3": 0.1173505347282153, "4": 0.030091639598825222, "5": 0.011284152175271601}, "score": 1.562554762359228}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.26216243143820334, "4": 0.23750811207155245, "1": 0.20904201886994367, "3": 0.2032669579675411, "2": 0.08790441922126507}, "score": 3.2558742148585913}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.5020061542015077, "2": 0.2009535082331914, "3": 0.1926706354439457, "4": 0.06412112539543513, "5": 0.04009644507883518}, "score": 1.9391868156599155}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2776282750969076, "4": 0.22654173285856335, "1": 0.19900436894522958, "5": 0.1602791654585435, "2": 0.13641975673001092}, "score": 3.0126731748579765}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.38188548225222924, "3": 0.21996276433003148, "2": 0.1636171551468712, "4": 0.12999170997278853, "5": 0.10438972791428446}, "score": 2.411292879541515}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9012415556722192, "2": 0.08139891787344744, "3": 0.0139256335067854, "4": 0.0024315761755180462, "5": 0.0009363408423149574}, "score": 1.1202982135693156}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3173363584416373, "4": 0.19580267247006342, "3": 0.1954321731819866, "1": 0.18210132792330722, "2": 0.10918220356161916}, "score": 3.35714241003065}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6002281176133107, "4": 0.23579091972407457, "3": 0.11674744115210993, "2": 0.02543551126663133, "1": 0.02154447232447633}, "score": 4.36806955654407}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8567798738746626, "4": 0.08746133228809669, "3": 0.03483214192292291, "1": 0.013767910784652731, "2": 0.007097501913607967}, "score": 4.766495935380759}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.2596925883491625, "4": 0.23647714835744324, "3": 0.22674564417136542, "1": 0.16237081142712373, "2": 0.11460486770416806}, "score": 3.3165503194862254}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5730920668748571, "2": 0.34183644065956487, "3": 0.07657064501745528, "4": 0.007050166820187268, "5": 0.001407024623911258}, "score": 1.5217791084415404}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8503088521710869, "4": 0.11800771208495076, "3": 0.028422070651849755, "2": 0.0018514280847127282, "1": 0.001395423954282685}, "score": 4.814009467249599}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6684449395538614, "4": 0.2545118200158282, "3": 0.0689731693504582, "2": 0.0050456439101044664, "1": 0.0029834190617327697}, "score": 4.580454028519496}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.561276149204924, "4": 0.31074038199859777, "3": 0.10643771506349033, "2": 0.012697051218461554, "1": 0.008812218981291297}, "score": 4.403022378440976}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.34480977183687533, "4": 0.298588472434205, "3": 0.251218600638917, "2": 0.0701129125535181, "1": 0.035050955668857235}, "score": 3.848179186773777}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3468451681186205, "3": 0.23616362214831554, "5": 0.21269133409278332, "2": 0.10289849110008868, "1": 0.101237331683384}, "score": 3.46693128324828}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4534328005544051, "4": 0.3017905033027024, "3": 0.1667424287524735, "2": 0.046415083367460024, "1": 0.031549264577910935}, "score": 4.099219348695077}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4779775328505671, "4": 0.22926438998020457, "3": 0.20939999592626973, "2": 0.05403953881867101, "1": 0.029021045653725416}, "score": 4.0734571755982945}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.2951045141890368, "3": 0.2745618293122121, "5": 0.20558907170491886, "2": 0.13217565781818982, "1": 0.09239659053381213}, "score": 3.3893809232358874}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.28843627537916955, "5": 0.24589472052465755, "3": 0.22047913817994516, "1": 0.13102632785258755, "2": 0.11402757202073577}, "score": 3.4042004462377884}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5438797523685835, "4": 0.36140477080928607, "3": 0.07693460528390209, "2": 0.011197012246211249, "1": 0.00638586707481089}, "score": 4.4254777626534265}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5543138147451491, "4": 0.36203466937067147, "3": 0.07210057209350763, "2": 0.007698136441489395, "1": 0.0037993943748151297}, "score": 4.45544311321555}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.497714156340968, "4": 0.344315565685795, "3": 0.12978375975369066, "2": 0.016598764734048595, "1": 0.011465439836474167}, "score": 4.300373287362605}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8872700320735558, "4": 0.09803211008988393, "3": 0.012515100797447389, "1": 0.0011499555379575577, "2": 0.0009467831284815081}, "score": 4.869486290201018}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6679674594701933, "4": 0.2514254889345022, "3": 0.06228514030609461, "1": 0.009275268705174358, "2": 0.008962644055925676}, "score": 4.5599782622865295}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2790778789752501, "2": 0.2733117210082818, "1": 0.268822545290976, "4": 0.12485277947364444, "5": 0.05379497595021174}, "score": 2.4214048590086508}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.33636291424153053, "3": 0.22457516885056508, "2": 0.22429949251194917, "4": 0.11875294931962672, "5": 0.09583855710276311}, "score": 2.4133044657183236}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.33234476502839183, "5": 0.2781938795262225, "3": 0.26848882124413415, "2": 0.07657915248869801, "1": 0.04398955322317899}, "score": 3.72446682548952}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5157493950414774, "4": 0.270171374760221, "3": 0.14428941067365675, "2": 0.0373495804648699, "1": 0.032134951802641996}, "score": 4.200417152833026}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.40893473818947057, "4": 0.26611160247863713, "3": 0.226659859851028, "2": 0.061000360804405414, "1": 0.03699872967631032}, "score": 3.9492630150545964}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3537493738717881, "4": 0.2453830058299449, "2": 0.17499609842875183, "5": 0.11300775887684723, "1": 0.11278359329605972}, "score": 3.0708409178576606}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6566241790275362, "4": 0.2547044055831676, "3": 0.06827872871033173, "1": 0.011100328239221824, "2": 0.009236751725446714}, "score": 4.536600800756065}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5095900500165823, "4": 0.24235843797189405, "3": 0.15250263567031327, "1": 0.05087469145522148, "2": 0.044597101984200506}, "score": 4.11527802197665}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.24677544140145397, "4": 0.21373913561269034, "1": 0.21349751195242073, "2": 0.17429481054856355, "5": 0.1515816583849552}, "score": 2.915603212573979}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3699423116349246, "3": 0.23672922536888333, "5": 0.2145076021464286, "2": 0.10102805787275565, "1": 0.0777323316038398}, "score": 3.542497600422184}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.39077147217761454, "3": 0.2677071553032504, "5": 0.16119691287379, "2": 0.11445604684892254, "1": 0.0655570580679926}, "score": 3.4677407682401573}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31434882563871025, "4": 0.24531995050040353, "2": 0.18733751423971545, "1": 0.12925161118801481, "5": 0.12334240631518642}, "score": 3.04618248529039}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3205483679394953, "4": 0.26312928227462834, "2": 0.17827392626499017, "5": 0.13260480037003683, "1": 0.1052794748020421}, "score": 3.1395289105859105}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7237022486190402, "4": 0.23523198066168627, "3": 0.036145139249960614, "2": 0.003317950519744612, "1": 0.0014737958433465824}, "score": 4.6765870227898505}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3309700801456234, "5": 0.27116285435890003, "3": 0.23966031796378742, "2": 0.09389620583756399, "1": 0.06421473997582619}, "score": 3.651032473103799}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6287912018084106, "4": 0.24753361203306906, "3": 0.09710154426007937, "2": 0.014199045996171918, "1": 0.012342204867585922}, "score": 4.466280054246639}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6639889640834984, "4": 0.2913339428017634, "3": 0.03908498895105678, "2": 0.00288203827726284, "1": 0.00256276634604241}, "score": 4.611541679348077}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.378601177526169, "2": 0.2418462464477523, "1": 0.17708197819265958, "4": 0.15063477207427034, "5": 0.05176776607269677}, "score": 2.6581368342867244}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9437881692484316, "4": 0.052906059519258426, "3": 0.0028714458373012876, "1": 0.0001826632982667353, "2": 0.00014458644413090083}, "score": 4.9401802310398795}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3795874400965105, "4": 0.3606324439970214, "3": 0.157244823950089, "2": 0.05313903491464961, "1": 0.04924512997547795}, "score": 3.968324369345556}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4723247973833664, "4": 0.2221799810766104, "3": 0.2007156197199751, "2": 0.05729720126483298, "1": 0.04737808021321086}, "score": 4.014882086998499}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4454581838003829, "4": 0.25851359358860587, "3": 0.17271341824560607, "1": 0.06540325180278155, "2": 0.057642035180449726}, "score": 3.961240493424787}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8196734661856488, "4": 0.10043667997981255, "3": 0.06469767585439558, "2": 0.008521328696555116, "1": 0.0065886796970609385}, "score": 4.718226110189468}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6017287599952953, "4": 0.2966249004011161, "3": 0.08078399619229287, "2": 0.011758322397046266, "1": 0.00892884706938945}, "score": 4.470724036387137}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.511264525649693, "4": 0.29808091574157686, "3": 0.13196743386214946, "2": 0.031237343276266216, "1": 0.027356453997002636}, "score": 4.234774954197274}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6587225564712893, "2": 0.2606112097654251, "3": 0.06410264834976634, "4": 0.012677645922605934, "5": 0.0037634206041209295}, "score": 1.4419572747625733}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7508747190314966, "4": 0.19998392313301885, "3": 0.041499425301416905, "2": 0.0038682866348006217, "1": 0.0037251859832788084}, "score": 4.690496623919028}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8711168543428657, "4": 0.09136783290944547, "3": 0.0318223151824476, "2": 0.003022048700320067, "1": 0.002633093995743893}, "score": 4.825382404515491}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8502701384903711, "4": 0.11860729322507223, "3": 0.026249500990786347, "1": 0.0026750221989385067, "2": 0.0021726507785237354}, "score": 4.811670881172816}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8369524082714394, "4": 0.13599927828338254, "3": 0.02354301277489021, "2": 0.001893715323305603, "1": 0.0015853580470046472}, "score": 4.80488700072174}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4697577935406021, "2": 0.2560985109817307, "3": 0.1501135456866169, "4": 0.08402317712856888, "5": 0.03982494516842119}, "score": 1.9678710935640908}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5862077089941625, "4": 0.2666256938099774, "3": 0.1073790157581115, "2": 0.019967314845679936, "1": 0.01968938344351279}, "score": 4.379875632532999}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.25118483912781553, "2": 0.2269149049143754, "1": 0.21732390251521766, "4": 0.15240421174338672, "5": 0.1520694126809072}, "score": 2.7949592635268217}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7039111768720062, "4": 0.22214323554667945, "3": 0.056489347411233626, "1": 0.00919630045736699, "2": 0.008193959848330386}, "score": 4.6034848262390025}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.47812812905212804, "2": 0.24943448086997022, "3": 0.14777264038778992, "4": 0.07701503626681225, "5": 0.04737804704856631}, "score": 1.9657994338711713}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3417596044644165, "3": 0.2953623710614341, "5": 0.15856900779583363, "2": 0.12174499824986068, "1": 0.08233908295491552}, "score": 3.372558257464456}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7814911371530098, "4": 0.18419030307589218, "3": 0.02802256501420963, "2": 0.0033775742657252846, "1": 0.0027758271614539568}, "score": 4.7384912460487225}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.37125040424143585, "5": 0.32689573896864044, "3": 0.23062409230499278, "2": 0.050085586845296536, "1": 0.021051728672848706}, "score": 3.9329390872424126}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7052638294533883, "4": 0.22701921897420885, "3": 0.05588443954022424, "2": 0.006859731348756791, "1": 0.004894980434722454}, "score": 4.6210233016788}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.36002366988962314, "4": 0.3254330246334797, "3": 0.1906437835155203, "2": 0.07105368932717519, "1": 0.05269868375145279}, "score": 3.869157203094013}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5748854358707596, "4": 0.2387172217848669, "3": 0.11913248331108782, "1": 0.037058656900448024, "2": 0.029811737117830757}, "score": 4.285065956169344}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6160006686367111, "4": 0.27465832729273465, "3": 0.07737877970456425, "1": 0.01818519822745821, "2": 0.0136392951925815}, "score": 4.456850626333533}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9495537448634536, "4": 0.04334183257849893, "3": 0.006129031714461039, "1": 0.00044166287197662865, "2": 0.0003888171796545044}, "score": 4.9414585176731425}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8182095840310627, "4": 0.1336024072103998, "3": 0.03837247013763846, "1": 0.005456176550510398, "2": 0.00417845089674097}, "score": 4.7552483153075285}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6324576165707491, "4": 0.23260559151478216, "3": 0.08820196829046241, "1": 0.02795741274651008, "2": 0.018577425837516835}, "score": 4.423313214675884}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5515388491874097, "2": 0.2552946016708434, "3": 0.1372286728140005, "4": 0.039962794308758466, "5": 0.015798194778532823}, "score": 1.7129592227287165}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.27383314991241375, "1": 0.26714411757627204, "5": 0.16578846673653327, "2": 0.14746796695119746, "4": 0.14570016985438747}, "score": 2.795507378337434}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.42522716371273306, "3": 0.2272749638574176, "2": 0.22162936928858265, "4": 0.08253899752953434, "5": 0.0431964527228721}, "score": 2.0967280233153054}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2902090075217902, "1": 0.2879841025064871, "2": 0.27907637195877266, "4": 0.10538314186733702, "5": 0.03719892931396142}, "score": 2.324636167902426}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7488950390982434, "2": 0.19058297784759853, "3": 0.045783294651421745, "4": 0.010154323536542017, "5": 0.004529771419644181}, "score": 1.3307496802036327}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.29860382027612425, "3": 0.2928422531792783, "1": 0.25674916047341084, "4": 0.11614803937733621, "5": 0.0354532270187109}, "score": 2.374825129308721}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.28051370388718005, "3": 0.25036928775857487, "4": 0.23564291307712937, "2": 0.11750631525396239, "1": 0.11572558928069962}, "score": 3.447821285205678}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.3205747180983166, "2": 0.293879782008731, "3": 0.2652684624372029, "4": 0.08709101131911835, "5": 0.03307273010694389}, "score": 2.2181186692771844}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.2795069837824112, "1": 0.263127519314343, "3": 0.25238592866697984, "4": 0.16525975007899465, "5": 0.03944115755131592}, "score": 2.438223497790012}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.42952827816195904, "2": 0.2640962655676403, "3": 0.18956835634587438, "4": 0.0845691276808486, "5": 0.0321111903680436}, "score": 2.0255151395069872}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3415206955172639, "3": 0.2121606093211361, "2": 0.20755606147897596, "4": 0.17308219183417164, "5": 0.06550539980289789}, "score": 2.4133928580123936}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3907850556300665, "2": 0.25054598561392805, "4": 0.18165950423383642, "1": 0.13571015238733244, "5": 0.04119048483115491}, "score": 2.7420461136611674}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.38879868056894645, "5": 0.2891020901889448, "3": 0.22719122846243023, "2": 0.057054975129473835, "1": 0.03777193546966452}, "score": 3.8344716823374094}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6208699867989657, "4": 0.2537990415773391, "3": 0.10160722847104349, "2": 0.01489572529716584, "1": 0.00873329540352894}, "score": 4.463315307884995}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.38847612708778057, "3": 0.33984460838691666, "5": 0.11481843779756812, "2": 0.11210691105516825, "1": 0.04468687699480881}, "score": 3.4166602699917052}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4395559571230369, "5": 0.36976853506745994, "3": 0.14738284352457803, "2": 0.025240791067038786, "1": 0.017940719809425805}, "score": 4.118095076650819}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3604118405050612, "4": 0.2370338312841853, "2": 0.19939701330037543, "1": 0.10900079534897801, "5": 0.09409045238236972}, "score": 3.0078166484745075}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.38243919716936786, "4": 0.34238241297794697, "3": 0.21338590328604967, "2": 0.040671771585676385, "1": 0.021036947130514298}, "score": 4.024600970090805}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.73841238734982, "4": 0.2124049467716926, "3": 0.04165536113188996, "2": 0.004442695465128314, "1": 0.0029863167712785347}, "score": 4.678979423565747}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2613163595789428, "3": 0.25738576200909574, "5": 0.18425220141606447, "1": 0.15249398901600572, "2": 0.14443596766311328}, "score": 3.180417694708731}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4082812515625539, "2": 0.2973424423004101, "3": 0.20077411677416832, "4": 0.0675858795600456, "5": 0.025922983758072966}, "score": 2.005434082747374}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.35104505567772176, "2": 0.28730977210019565, "3": 0.235234991650309, "4": 0.09544264383842853, "5": 0.030865414307881867}, "score": 2.16768859133876}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3555823183513636, "4": 0.27540707585705876, "2": 0.18023334617717343, "5": 0.09755275211093577, "1": 0.09103188948061286}, "score": 3.1082363032032556}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5200449285922942, "4": 0.33765051422826986, "3": 0.11469916898393975, "2": 0.01825180316997806, "1": 0.009172246858405942}, "score": 4.341387319243927}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3081123160443838, "3": 0.29950316316398035, "5": 0.15693433649585628, "2": 0.14205743945017243, "1": 0.09322593718792159}, "score": 3.293520636699971}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2840294355184787, "4": 0.21667704628006998, "1": 0.2116880182971873, "2": 0.15846083721691293, "5": 0.1290109234885046}, "score": 2.8928476889815613}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3315794267553153, "5": 0.32289912856443825, "3": 0.21650446677439983, "1": 0.066027477357226, "2": 0.06290023998130197}, "score": 3.782492334898173}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2943882807955711, "4": 0.26600533872689097, "5": 0.20046762832678156, "1": 0.12789687549198517, "2": 0.11116792311217984}, "score": 3.3000011074301794}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6416307606003435, "4": 0.2534611302638505, "3": 0.0794840107651998, "1": 0.013703220510697885, "2": 0.011617647508393674}, "score": 4.497853186845743}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.28671855183701145, "4": 0.2518610833540514, "5": 0.16790626528837554, "2": 0.14697232136003355, "1": 0.1464294992710204}, "score": 3.1478588954613143}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5010523461609943, "2": 0.2780766455148057, "3": 0.12220753169239043, "4": 0.06907617484951725, "5": 0.02918694379525346}, "score": 1.8468070345889305}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4998877528812743, "4": 0.310576851306568, "3": 0.12463331908365353, "2": 0.032527428230968713, "1": 0.03224826614923649}, "score": 4.213481759214022}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5845197553057669, "4": 0.25101120485252826, "3": 0.1393598698208111, "2": 0.01758848768090803, "1": 0.007438859759604774}, "score": 4.387698053299454}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.32105667943192634, "1": 0.3156610397893404, "3": 0.22963975053823096, "4": 0.11248588858559219, "5": 0.021106426740897796}, "score": 2.2022799256118395}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3447286821150644, "5": 0.30447393342867207, "3": 0.21300796917616321, "2": 0.07577582262076513, "1": 0.061916764745987445}, "score": 3.7541402186834154}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"2": 0.27360631838170735, "3": 0.26045627035477786, "1": 0.2429739118613992, "4": 0.15664372810768276, "5": 0.06614521014748305}, "score": 2.52929783998922}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.38539981616496494, "2": 0.24256656777157906, "4": 0.18104647730286771, "1": 0.13356406882135244, "5": 0.05730150444623042}, "score": 2.785928757104864}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.36058127388382355, "4": 0.20765290896957672, "2": 0.1606632531146062, "5": 0.15359775104651593, "1": 0.11730342794584132}, "score": 3.1196023881880053}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7680194504871679, "4": 0.1776511825338435, "3": 0.04353280008843719, "2": 0.005585615760426613, "1": 0.005148557503235283}, "score": 4.697913291709697}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5153224591432151, "4": 0.3409616061408117, "3": 0.10802733305884989, "2": 0.018792507985172676, "1": 0.01678907335009034}, "score": 4.319377069900565}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4985732547626319, "4": 0.336157492889561, "3": 0.14317914078141664, "2": 0.013934706226098692, "1": 0.008101808261970501}, "score": 4.30323552928152}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9634648917862101, "4": 0.03276053464747323, "3": 0.003349752555175392, "1": 0.00027969551302044475, "2": 0.0001330470144634206}, "score": 4.95902154218907}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.778698432010633, "4": 0.18422476830571938, "3": 0.03237335082591452, "2": 0.002354394493170815, "1": 0.0022491295596368224}, "score": 4.7349423424896715}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9472955676890132, "4": 0.04445212551745539, "3": 0.007543107851419619, "1": 0.00036363534205984113, "2": 0.00032579767438154427}, "score": 4.938028499464249}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9510368980291345, "4": 0.04353016208068428, "3": 0.00484385348715879, "1": 0.00033640098560819184, "2": 0.0002248886875893911}, "score": 4.944760325457489}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3552471978008023, "3": 0.30578287124171216, "5": 0.1707090898773355, "2": 0.10565678663727278, "1": 0.06240525452628344}, "score": 3.466290780433892}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.699682834631589, "4": 0.23247801908359453, "3": 0.0642099047879531, "2": 0.0026476672756280887, "1": 0.0009618670678065627}, "score": 4.62730435647216}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6063826842853998, "4": 0.31921653926782373, "3": 0.07037404941767562, "2": 0.003105027832092475, "1": 0.0008651823188542899}, "score": 4.527232829800577}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8895789438493801, "4": 0.10220254493560672, "3": 0.007765817094779819, "2": 0.00024245631697470305, "1": 0.0001734864603415059}, "score": 4.880840126797181}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4093083602358917, "5": 0.40514361491686374, "3": 0.15527890374591793, "2": 0.020691121164054853, "1": 0.009492037402432315}, "score": 4.180021831768524}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3377474000584097, "3": 0.30675861838229274, "1": 0.26689597586471253, "4": 0.07606506397579169, "5": 0.012393687606253936}, "score": 2.229205751131388}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8216930271203581, "4": 0.1543921476305236, "3": 0.02127538092213053, "1": 0.0014669718042687999, "2": 0.0011239275352579732}, "score": 4.793807411085723}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6822617753229616, "4": 0.2517754651416319, "3": 0.05999544717834579, "2": 0.0032861355810771377, "1": 0.002595702723466561}, "score": 4.607958913524165}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7909950967758532, "4": 0.17702958738691432, "3": 0.02761994837829561, "1": 0.0023102593223306546, "2": 0.001978875747164632}, "score": 4.752536461224206}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5916024185518169, "4": 0.33250323154537437, "3": 0.06422098837400547, "1": 0.0060188504081398865, "2": 0.005586716235124615}, "score": 4.498185220893169}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29943126108669443, "2": 0.26856156471846787, "1": 0.2204198593100898, "4": 0.16458413180059997, "5": 0.04692991314090118}, "score": 2.5490096307049916}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5352737771425871, "4": 0.29039064811813114, "3": 0.12667440812766692, "2": 0.026625986606390803, "1": 0.020936678625358203}, "score": 4.292566178098308}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5601826431195562, "4": 0.3109506378935089, "3": 0.10959243835058013, "2": 0.011626195431249391, "1": 0.00758556636413161}, "score": 4.404606410337907}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8692120042562933, "4": 0.11366231222176076, "3": 0.015258447421686437, "1": 0.0009329219644537004, "2": 0.0009055047816328745}, "score": 4.849368251128752}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.41099470819777334, "3": 0.23587489982235738, "5": 0.23348643448145814, "2": 0.07803249004362554, "1": 0.04153287070844086}, "score": 3.71692569372708}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.29756532448480805, "3": 0.24919628497124646, "5": 0.19145683508972292, "2": 0.14064331141415035, "1": 0.12083419045016493}, "score": 3.298257988761975}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.27910665338786794, "1": 0.27353237258807306, "3": 0.25025449472726274, "4": 0.14967110882548396, "5": 0.0472597923978327}, "score": 2.417917094061905}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3750219205200513, "5": 0.28733040168242563, "3": 0.25022283953591284, "2": 0.059399931845283256, "1": 0.027778870534163256}, "score": 3.834930473826966}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.37748160120900875, "3": 0.24657408080514667, "5": 0.22216833915062312, "2": 0.0909996152951543, "1": 0.06263606804145738}, "score": 3.605631495504822}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2859409379937156, "4": 0.26668694476624855, "2": 0.2041353754662073, "1": 0.13885765990337048, "5": 0.10420689302285417}, "score": 2.9932488730702422}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7081514894688506, "2": 0.20972922185912823, "3": 0.05750072629736985, "4": 0.01540313837100471, "5": 0.009003991499666627}, "score": 1.407042117499677}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.615765173487054, "4": 0.3287960267390838, "3": 0.049783767594653, "2": 0.003912239135387741, "1": 0.0016470787742483702}, "score": 4.553268647003306}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5122485871463357, "4": 0.39487283603560264, "3": 0.0851587770223477, "2": 0.0054968982520412395, "1": 0.0021041472517130204}, "score": 4.409832241202392}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6074914548238152, "4": 0.3356582666905075, "3": 0.0507465572905834, "2": 0.004048977090547937, "1": 0.001981682594391375}, "score": 4.542741549086161}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5760462882326742, "4": 0.307841727450483, "3": 0.0934471073075506, "2": 0.014378934865240741, "1": 0.008087510668674051}, "score": 4.4296640380576076}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4482788532108132, "2": 0.2905711529439128, "3": 0.16783450070073833, "4": 0.07351863260943567, "5": 0.01966645473478429}, "score": 1.925582572448952}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.3477073852154159, "2": 0.3443119159601423, "3": 0.23660398140529382, "4": 0.06048647455579985, "5": 0.010740549793613052}, "score": 2.0420974963857788}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.25697486510952827, "1": 0.24035203929239624, "2": 0.20858500979489739, "4": 0.2046173355644309, "5": 0.08925355742616922}, "score": 2.693768850832493}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.38737266137546206, "4": 0.31338102390998773, "3": 0.2109095521931183, "2": 0.052250892862798236, "1": 0.03591853577073358}, "score": 3.964199725545434}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.30902966606805643, "4": 0.26511727598656004, "2": 0.1750908319498, "1": 0.1486435828493449, "5": 0.10184791579442982}, "score": 2.9964341445523277}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3070873021490293, "4": 0.21773259446826412, "3": 0.20119159821564572, "1": 0.1713654103117707, "2": 0.10245840168473344}, "score": 3.386781676758707}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.29566524313581755, "3": 0.2024292168420822, "2": 0.19278534714097648, "4": 0.16401317811933344, "5": 0.1449837082167441}, "score": 2.6698240482843465}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.27944781841681937, "1": 0.21556072986946992, "4": 0.18205881222713782, "2": 0.1766921899719054, "5": 0.14599873816742773}, "score": 2.866210300362602}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7055066159908001, "4": 0.18121949551833189, "3": 0.0752941000376258, "1": 0.023387436558730917, "2": 0.014523721511215976}, "score": 4.531039208678986}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.725229153699552, "4": 0.14721732243874852, "3": 0.0758234930239984, "1": 0.03460056041791717, "2": 0.01698864668653901}, "score": 4.5116987453763455}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"3": 0.42752822901575444, "2": 0.21722432579044432, "4": 0.17472284558745246, "1": 0.1215834281984442, "5": 0.05886369865357047}, "score": 2.832046048852064}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3192619989396672, "1": 0.20746463242158872, "4": 0.1905506196052525, "2": 0.15332623081679167, "5": 0.12924001783846073}, "score": 2.8807564979690343}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4312572194599487, "4": 0.2404261993351164, "3": 0.2342639518450165, "2": 0.055657318526338616, "1": 0.038276834849433}, "score": 3.970844671807755}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.632853842514653, "4": 0.2702229553988781, "3": 0.07749522170058, "1": 0.009927565471670046, "2": 0.009349896549194719}, "score": 4.506952436952629}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2557471034303682, "4": 0.23718562892821465, "1": 0.19113079399114874, "5": 0.1795195972738658, "2": 0.13619983455342846}, "score": 3.077780282514529}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4688057619246329, "2": 0.3107500772497612, "3": 0.16946246874715742, "4": 0.04347567903010211, "5": 0.007387068554895415}, "score": 1.809746640957996}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5803948448939033, "4": 0.29134087663211433, "3": 0.10740178252264397, "2": 0.013318622967931225, "1": 0.007493547215787211}, "score": 4.4238965077051775}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6891403828697545, "4": 0.24590905660475684, "3": 0.05478178668690026, "2": 0.00581204378355399, "1": 0.00429525480218753}, "score": 4.6098862371198175}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.36731584057885736, "4": 0.34607436474819875, "3": 0.19302727091141877, "2": 0.05007002266370413, "1": 0.0434534947054464}, "score": 3.9437847231630094}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5008754558093942, "4": 0.2957869344196324, "3": 0.13861377644719447, "2": 0.03264048140719668, "1": 0.032019044902907134}, "score": 4.200936503465561}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"1": 0.915620025218435, "2": 0.07101276708553733, "3": 0.010827923199759695, "4": 0.0014229743291328562, "5": 0.0010434716500000798}, "score": 1.1011187884150582}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.23898201044217174, "3": 0.23652598593088497, "5": 0.1950097542255393, "4": 0.17127815612946246, "2": 0.1580731940093632}, "score": 2.925250665054012}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5958939464192311, "4": 0.18094497490232955, "3": 0.10934874596601175, "1": 0.07388146458585977, "2": 0.03971938195386964}, "score": 4.185501273742315}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8721587839186514, "4": 0.09672158357814767, "3": 0.02218475805506511, "1": 0.0053492409855435755, "2": 0.0033999960810263304}, "score": 4.827279884816542}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.27256447155503555, "4": 0.24208424344349286, "3": 0.21455943344407583, "1": 0.14326420012899985, "2": 0.12727681739735835}, "score": 3.3735016558241364}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.28559781474473195, "1": 0.2176608416306446, "2": 0.1987604993350431, "4": 0.18689029351096162, "5": 0.11089538495103214}, "score": 2.774554881633592}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.639377347965936, "4": 0.2194655075098663, "3": 0.1083910129260269, "2": 0.018342338722005597, "1": 0.014313884052284885}, "score": 4.451409619339392}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7248363019759119, "4": 0.14594633402753154, "3": 0.09496581445352544, "2": 0.01927015987529467, "1": 0.014898697290809133}, "score": 4.546679282108624}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.43717423773464636, "4": 0.26150465355868324, "3": 0.1761697077418033, "1": 0.07653465761673388, "2": 0.048535038430899284}, "score": 3.934325114319744}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6078739850065429, "4": 0.211561784047381, "3": 0.12216777183085803, "1": 0.030219846547386166, "2": 0.02807846967677453}, "score": 4.338922997062754}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.357945478096305, "4": 0.32830074014484223, "5": 0.1647776647699909, "2": 0.09842270103069324, "1": 0.05048087133013846}, "score": 3.458504888060408}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7215219561333339, "4": 0.23822332617697028, "3": 0.03623626014552258, "2": 0.002603862394307604, "1": 0.0013761938087597163}, "score": 4.675975348132839}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5127629122482792, "4": 0.2786700537595162, "3": 0.165155999537025, "2": 0.0276710787410493, "1": 0.015648910203183087}, "score": 4.245340361758199}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9314145471228987, "4": 0.06391516639410853, "3": 0.004260809982659642, "2": 0.00018665678533680852, "1": 0.00016532935213930012}, "score": 4.926337691003132}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8494324996025909, "4": 0.13319978966082907, "3": 0.015532159469613352, "2": 0.00098111684248707, "1": 0.0007798445133584536}, "score": 4.829660457207692}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9106978857289515, "2": 0.08036509008608388, "3": 0.007930871898578405, "4": 0.0005173142678246796, "5": 0.0004181913312093936}, "score": 1.0994585684299405}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8424177058860536, "2": 0.1468715622962769, "3": 0.010003376429766538, "4": 0.0005440014748449317, "5": 0.00013620192918435768}, "score": 1.1690597176038082}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.47620378339039754, "2": 0.327808297599032, "3": 0.1558201221753039, "4": 0.03126224936261443, "5": 0.008815365505088699}, "score": 1.7685660628575886}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3490971251283548, "5": 0.23905137308563482, "3": 0.23885220678025618, "2": 0.09586675695425749, "1": 0.07687493487579068}, "score": 3.5777320702097786}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.35595555550886465, "2": 0.3076486788908645, "3": 0.21128319267477821, "4": 0.10132858762385842, "5": 0.023695327551579427}, "score": 2.129082239209269}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.31367505048172106, "3": 0.27271123250724005, "5": 0.17051711603414413, "2": 0.14192912013195816, "1": 0.10099357278073805}, "score": 3.3108470756697663}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.2725797901087843, "3": 0.2692079364591407, "5": 0.23270158438380822, "2": 0.1228065409036383, "1": 0.10260204650519497}, "score": 3.4100141880831667}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6794595610265096, "4": 0.21374680898539505, "3": 0.08510893115220357, "2": 0.011584028303670961, "1": 0.01002242697079476}, "score": 4.5411576344551925}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6157427354129563, "4": 0.26044257071526083, "3": 0.09666464100596454, "2": 0.016217506047134907, "1": 0.010804344037808876}, "score": 4.454288291221549}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.461051402514844, "4": 0.31011319592752534, "3": 0.15470588202288282, "2": 0.03841712328117847, "1": 0.03558428397405055}, "score": 4.122774150883788}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"3": 0.32711627181031666, "2": 0.20005601032824827, "1": 0.19665113666079923, "4": 0.18062457013386293, "5": 0.095252187439017}, "score": 2.7777040117724243}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3441474774371564, "3": 0.33555073900871435, "2": 0.13390889477498305, "5": 0.11130823880889845, "1": 0.07492977031037347}, "score": 3.28303935669852}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3725987036577933, "5": 0.3260169516633492, "3": 0.23447926902838054, "2": 0.04182579602554436, "1": 0.02489874446189093}, "score": 3.9331777934402514}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5238933478575885, "4": 0.3648349206125468, "3": 0.09035689052937057, "2": 0.01184126279772832, "1": 0.008912718298690264}, "score": 4.383177414718866}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.48145019031522174, "4": 0.33079838432137, "3": 0.13256621798713814, "1": 0.02787438812821725, "2": 0.02721035444485631}, "score": 4.210861283191036}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"1": 0.36262084308685016, "2": 0.22020551711263586, "3": 0.21350176059518244, "4": 0.12313314861932476, "5": 0.08041177968775373}, "score": 2.3384255172336474}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7856655075845785, "4": 0.1654589584689959, "3": 0.039118968568460685, "2": 0.004921873639181364, "1": 0.004757822373384003}, "score": 4.722484861570423}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.814730976839808, "4": 0.11833656129471459, "3": 0.051930343836206774, "1": 0.007896876321839975, "2": 0.006960400243773055}, "score": 4.72529425623219}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6575928290690325, "4": 0.24933525063319692, "3": 0.06998352652399444, "2": 0.011800893854477306, "1": 0.01116125358424457}, "score": 4.53059073921959}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8028425110392446, "4": 0.12401906192375922, "3": 0.04840194887779804, "1": 0.014882473999353584, "2": 0.009673704024447708}, "score": 4.690570242022628}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2977324841050667, "2": 0.2929265453087989, "1": 0.2254577046858863, "4": 0.1410816328149522, "5": 0.04262973348681301}, "score": 2.48241017162433}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3911493314669585, "3": 0.336209870307048, "5": 0.13274596696494118, "2": 0.10166420545248006, "1": 0.03802879663734514}, "score": 3.479016146101442}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.42255735074020645, "5": 0.3511411498593496, "3": 0.18591539022998152, "2": 0.02716105046839496, "1": 0.0130016500844812}, "score": 4.071914774819561}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7653370759838088, "4": 0.19445803452505067, "3": 0.034836287194450505, "2": 0.003247332788644831, "1": 0.002005915528000034}, "score": 4.718071208999982}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4134182031197841, "5": 0.2750027723757552, "3": 0.21975414066011284, "2": 0.057988874836384506, "1": 0.03374502769746082}, "score": 3.8380210618944286}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.40870762167701163, "4": 0.2652697357288785, "3": 0.16098631783503004, "1": 0.11079598962989884, "2": 0.05408062988680915}, "score": 3.807141274629188}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6535936832717186, "4": 0.27944248101445995, "3": 0.055587945988379704, "2": 0.005902906631355743, "1": 0.005364733381680818}, "score": 4.570167444337457}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8289041017261902, "4": 0.11814511759339294, "3": 0.04486892129303843, "1": 0.004243883538727779, "2": 0.0037818234177993382}, "score": 4.763782771240616}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.924717447772739, "4": 0.06583291090253576, "3": 0.008292125080859523, "1": 0.0006639867921672881, "2": 0.00045623341701345237}, "score": 4.9135549674591035}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2558675119278696, "5": 0.25229975358757234, "3": 0.22442401328161057, "1": 0.16305332246241758, "2": 0.10425285839729735}, "score": 3.330141368590133}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"3": 0.40329137636976453, "4": 0.21564162342999987, "2": 0.19065148567995702, "1": 0.09564058688633283, "5": 0.09471837157321306}, "score": 3.0231470162278593}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3524936750540046, "3": 0.2859643289191193, "5": 0.20376463524855806, "2": 0.09520591564378346, "1": 0.06250178891558758}, "score": 3.539851056059522}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5309098745093138, "4": 0.3382033625761878, "3": 0.11587464717229982, "2": 0.009834467224363982, "1": 0.005095917754853443}, "score": 4.380109606271863}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8941981134029642, "4": 0.09501344225218376, "3": 0.009765026508627355, "2": 0.0005544025003987476, "1": 0.0004095494110686141}, "score": 4.882148091412362}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8142468853578599, "4": 0.16108570925943624, "3": 0.022271984294462147, "2": 0.001308285732343389, "1": 0.001025610739932127}, "score": 4.786329876022559}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5028411821457998, "2": 0.2649544114657153, "3": 0.17213476353967316, "4": 0.04264512133419844, "5": 0.017299240157063616}, "score": 1.8064572972409156}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.453629270195857, "2": 0.25832329425510153, "3": 0.19845434605358386, "4": 0.05399796058907664, "5": 0.0354665351119185}, "score": 1.9592153577197289}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3561010642770924, "2": 0.20269913356560362, "1": 0.18232320777444996, "4": 0.16648026585158454, "5": 0.09225988936671455}, "score": 2.783624973442656}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.37168524442694617, "3": 0.2104020825744565, "2": 0.2014417744295432, "4": 0.13620928714994776, "5": 0.08016729021379689}, "score": 2.351670453069802}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.530385350612909, "2": 0.24426162366004206, "3": 0.14726781191453867, "4": 0.051215938323406256, "5": 0.02679103399140589}, "score": 1.7996717659415955}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29173874094742097, "4": 0.2617863934311595, "2": 0.18463290915926633, "1": 0.14125036851545733, "5": 0.12040583305262613}, "score": 3.0354710022584976}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4291334054413563, "5": 0.3466595515848241, "3": 0.17918652080365166, "2": 0.031158443845503085, "1": 0.013727804188451606}, "score": 4.063981321561498}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5081708850884568, "4": 0.2445514653472005, "3": 0.16337812164211515, "2": 0.04860943165154581, "1": 0.035099183882200145}, "score": 4.142303516000777}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.914741835968442, "4": 0.07459423899668156, "3": 0.008794075701043447, "2": 0.0009917320480691116, "1": 0.0007288706329016344}, "score": 4.901912291663262}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4582747426221584, "4": 0.411103652671918, "3": 0.10204041690654969, "2": 0.017836577756938112, "1": 0.010603904464279376}, "score": 4.288790091185641}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.438924553756971, "2": 0.2556881605164593, "3": 0.17208510982328498, "4": 0.08861173331033301, "5": 0.0446409937380421}, "score": 2.0443091949400585}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.39990674362229195, "4": 0.2076747552046921, "2": 0.20559968037472015, "1": 0.12761713886083462, "5": 0.059152312133379084}, "score": 2.8651387633022263}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.34632480551716227, "4": 0.21169563920302145, "2": 0.16672308775253789, "5": 0.1639136523293481, "1": 0.11130794940785374}, "score": 3.150189193758374}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8300147560301069, "4": 0.1432342753633435, "3": 0.023217348490382216, "2": 0.0018340834583400593, "1": 0.0016602650843420394}, "score": 4.7981797911463415}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3242610752026156, "3": 0.2580884302190041, "5": 0.17470299819954668, "2": 0.13788418297498903, "1": 0.10500403510411607}, "score": 3.3257941309406314}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8929439464576466, "2": 0.09229576698585754, "3": 0.01325812111454342, "4": 0.0009261960765488123, "5": 0.0005624878635666347}, "score": 1.1238422184779535}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8589313488846185, "2": 0.119139357453692, "3": 0.01786518557377216, "4": 0.0028460286858735676, "5": 0.0011884962813842619}, "score": 1.1681667746823803}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.8263439729517371, "2": 0.1450446866858739, "3": 0.025813829591226283, "4": 0.002017599178339868, "5": 0.0007647508220556531}, "score": 1.2057872665851441}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9365535853452556, "2": 0.055981667943060524, "3": 0.006669869396372888, "4": 0.00042900241915337515, "5": 0.00032312219292889103}, "score": 1.0719039768543654}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8916975619540232, "2": 0.09595971605580142, "3": 0.010721217039279108, "4": 0.0010914563211988975, "5": 0.00050703054988753}, "score": 1.1227074657877472}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"4": 0.41913278498209106, "5": 0.39190988532270254, "3": 0.13821294547530866, "2": 0.02920536072748925, "1": 0.021444222869011383}, "score": 4.130965965440549}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9415835042880579, "4": 0.05365304793800201, "3": 0.0041580544266897924, "1": 0.00030384769056127385, "2": 0.0002370968145575084}, "score": 4.936100043724507}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7917458540621674, "4": 0.14974422604880686, "3": 0.04818942405245945, "1": 0.005274269988513636, "2": 0.004932240163077116}, "score": 4.717950975851774}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9232069879380149, "4": 0.07101175161022866, "3": 0.0051689174660379264, "1": 0.0003138742907960092, "2": 0.00024602903513320937}, "score": 4.91665245847239}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8711198422788003, "4": 0.11560549375972845, "3": 0.011412530049848798, "1": 0.0010757986102019142, "2": 0.0007423990916684268}, "score": 4.855032685110406}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3667292285867117, "4": 0.23558575304020968, "2": 0.16058506127642752, "1": 0.11975395692763412, "5": 0.11719673038116553}, "score": 3.0698966721322662}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3363382933773427, "3": 0.2660101800681119, "5": 0.23536694843084943, "2": 0.09417322250169959, "1": 0.06795408652613699}, "score": 3.577081551778953}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4301379662552719, "4": 0.2693033875903289, "3": 0.17263578374630603, "1": 0.07752771450753337, "2": 0.050275052453112375}, "score": 3.9243598500424866}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5188626367097539, "4": 0.29713030470964424, "3": 0.1452033071987405, "2": 0.02222475325013346, "1": 0.016496703597572177}, "score": 4.279742733515969}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2612391258787545, "4": 0.23661384799703541, "1": 0.20242901441296654, "2": 0.16227358043466833, "5": 0.137357000419043}, "score": 2.9441913601772827}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.42389529500043227, "2": 0.3226812774646928, "1": 0.15563869743340136, "4": 0.07331727665327789, "5": 0.0243734708116138}, "score": 2.488057432232713}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.40518209323308635, "5": 0.2646949892100098, "3": 0.22991178203616466, "2": 0.05967892117956108, "1": 0.04038293436362794}, "score": 3.7942458467484603}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.607717514069646, "4": 0.2938774897553711, "3": 0.07835367549881987, "1": 0.010225813707745505, "2": 0.009737722677605132}, "score": 4.479253022979122}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6097848432605493, "4": 0.3289830991174337, "3": 0.05194507337026792, "2": 0.0055037863297919655, "1": 0.003600696428026352}, "score": 4.536127952098815}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6398311663554803, "4": 0.27600375728671084, "3": 0.07231050955556181, "2": 0.006913139519705303, "1": 0.004878216486484767}, "score": 4.539093804849607}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27235331592295664, "1": 0.21675952925939945, "4": 0.21371915193776192, "2": 0.1598607748088101, "5": 0.13726191362385562}, "score": 2.894858381423539}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.33122979492330895, "4": 0.2623994284703845, "2": 0.14383513947807286, "5": 0.1426945710103317, "1": 0.11980821775927283}, "score": 3.1643423938723214}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33131251333006456, "1": 0.2325372852838153, "2": 0.20582258893842262, "4": 0.15156272701811138, "5": 0.07868356314077204}, "score": 2.638003255389787}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.36190037942066106, "4": 0.27222177381258933, "3": 0.1955380674690775, "1": 0.0983568585925005, "2": 0.07193416163793445}, "score": 3.727410121670007}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.2402878978931596, "4": 0.23610055126833068, "3": 0.23476283199551223, "2": 0.1480672968678619, "5": 0.14072791974080853}, "score": 2.8889073543910095}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.31598241995392506, "3": 0.30454342230866016, "5": 0.16561845500059608, "2": 0.12397793162275667, "1": 0.08980884606560152}, "score": 3.3436473921143115}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.510714404664428, "4": 0.2881370338585431, "3": 0.1419675029551657, "2": 0.03395458440748161, "1": 0.02516868540107591}, "score": 4.2253446990712815}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5211188469994154, "4": 0.3055009777147483, "3": 0.1388038907447596, "2": 0.02267264153675503, "1": 0.011847069992395484}, "score": 4.301445516884781}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6433879969555814, "4": 0.28462791872998733, "3": 0.05674833285820872, "2": 0.007809900931797868, "1": 0.007385413298310693}, "score": 4.548885817758768}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7558032409277972, "4": 0.17792707564900306, "3": 0.04851848110062785, "2": 0.009221652753950267, "1": 0.008455760955761336}, "score": 4.663523131903489}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"1": 0.38941681700867575, "2": 0.37616723896430626, "3": 0.18541283491690974, "4": 0.04210124358053557, "5": 0.006700249596969987}, "score": 1.9002791485477495}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3656859405047299, "3": 0.3169695710787734, "5": 0.17980022599878417, "2": 0.09034251589162011, "1": 0.047057453919715844}, "score": 3.5409070176546313}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5200923432497984, "4": 0.336954254893285, "3": 0.1252454583942417, "2": 0.01159614805777715, "1": 0.0060266378151913255}, "score": 4.353604787425835}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.49554859865071527, "4": 0.3586178651120588, "3": 0.12088915833873205, "2": 0.015923642889897234, "1": 0.008768513370700618}, "score": 4.316586464376668}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3627219921445675, "3": 0.29692443504782273, "5": 0.20504604813897329, "2": 0.0859742711641101, "1": 0.04907363273161941}, "score": 3.5888454283003832}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9229891958676141, "2": 0.0683973498491297, "3": 0.007668264196279989, "4": 0.0005048410150191199, "5": 0.00041894554947798}, "score": 1.0869260440081958}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.607911966159645, "2": 0.19581976678952628, "3": 0.12445826999824264, "4": 0.04728481835571467, "5": 0.024354398724451293}, "score": 1.6841251916323197}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.43017017189040835, "3": 0.2147762909, "2": 0.1905725341865714, "4": 0.09277865281250011, "5": 0.07145392804358765}, "score": 2.1845710603081097}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.4633021712881202, "3": 0.19868122958326148, "2": 0.1797069518635807, "4": 0.0827850739620199, "5": 0.07531515521137243}, "score": 2.126921251459568}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.24674972874011283, "3": 0.22956434922572735, "5": 0.22588849193243654, "4": 0.1834254978862086, "2": 0.11412807457656134}, "score": 3.027581675696608}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6457697260305294, "4": 0.2710376873660663, "3": 0.06914799612229068, "2": 0.008307544509507108, "1": 0.005632767469318407}, "score": 4.543164978911765}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5032208196241484, "4": 0.34912645051851476, "3": 0.12345725452907015, "2": 0.016677969868173877, "1": 0.007429557335662895}, "score": 4.324147461513021}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6373645277641768, "4": 0.2835493491179885, "3": 0.06793667891917868, "2": 0.006632363849121619, "1": 0.00445453455727007}, "score": 4.542833469424357}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8626901936582233, "4": 0.1221416795815464, "3": 0.013677173549685492, "2": 0.0008281502157878529, "1": 0.0005579250073750766}, "score": 4.84577164748301}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.41108143723079427, "5": 0.331704090890989, "3": 0.1717077800884748, "2": 0.05405725588316399, "1": 0.03136062041669479}, "score": 3.957796189433992}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.2621753563646701, "3": 0.21617230088512307, "4": 0.19924907574352235, "2": 0.19568765261586263, "5": 0.12640255296063097}, "score": 2.731931894535096}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8256299733368714, "4": 0.11558628172323002, "3": 0.051020636032981896, "2": 0.004686248078235591, "1": 0.002963555941736262}, "score": 4.75643188075094}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6534882540428835, "4": 0.21635417825888326, "3": 0.11330889563962634, "2": 0.010363609453308158, "1": 0.006396109270264089}, "score": 4.500308315779083}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.723158229105053, "4": 0.1951093126092342, "3": 0.06045807072986171, "1": 0.011906854932105193, "2": 0.009263521602268255}, "score": 4.6085158427287265}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9024756587977862, "4": 0.07800670456695086, "3": 0.01557003570417204, "1": 0.0021342151737502786, "2": 0.0017367436233452689}, "score": 4.877096712889469}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"3": 0.41696435101933854, "2": 0.32524107577942596, "1": 0.16128754712888738, "4": 0.07167091945862994, "5": 0.02474576291442021}, "score": 2.4732986911055987}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4695000846667359, "4": 0.3556065698924433, "3": 0.13618272892846428, "2": 0.02190392794550962, "1": 0.01669458272348175}, "score": 4.239452595711995}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.785368990536924, "4": 0.16830775506994577, "3": 0.03832825984177443, "1": 0.004393065517640019, "2": 0.0035015274198941185}, "score": 4.726931464394604}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6096090371490593, "4": 0.3290727592275784, "3": 0.053288283166323995, "2": 0.004781614633890336, "1": 0.00310978278276609}, "score": 4.537502632865574}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6416258713925757, "4": 0.26840825983772243, "3": 0.07425035649733094, "2": 0.008008522434690336, "1": 0.007650785168539932}, "score": 4.528435815080393}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"3": 0.30103233342071534, "4": 0.2355450473391582, "1": 0.15939233505688294, "2": 0.15861595116941773, "5": 0.14526546751558045}, "score": 3.0486826082478684}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6299684312368004, "4": 0.2178213167987621, "3": 0.11759077387960021, "1": 0.018174908317580667, "2": 0.016354617591726475}, "score": 4.425181943261798}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.841466521884061, "4": 0.10940551269486004, "3": 0.03916794877190378, "1": 0.005496879562618955, "2": 0.004298278866560736}, "score": 4.777339527502015}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.918619499412239, "4": 0.06581549381869277, "3": 0.012934945198972597, "1": 0.001607137713308802, "2": 0.0009451262892325093}, "score": 4.899042831840319}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6511699701445561, "4": 0.2418225950414223, "3": 0.07937815297805723, "1": 0.015067829569111362, "2": 0.012458595408834799}, "score": 4.5017227432664635}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.36961904938461004, "2": 0.3549259864914508, "1": 0.1718547217615562, "4": 0.08762425813723987, "5": 0.01585099982827632}, "score": 2.4206184141211624}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6752094094504666, "4": 0.26606354706276414, "3": 0.052743749844827756, "2": 0.003400645542299384, "1": 0.0025008390085255253}, "score": 4.608211608734382}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7067337537063954, "4": 0.21911512551668416, "3": 0.06527109434786024, "2": 0.005113714146195996, "1": 0.003694393052185053}, "score": 4.620196655975955}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9476459404749384, "4": 0.048837207884297434, "3": 0.003205173679199135, "1": 0.00016422501957327884, "2": 0.00011852329908080123}, "score": 4.943738347152243}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7152431100670692, "4": 0.23764039341206156, "3": 0.0396741752672735, "1": 0.0037083360760100537, "2": 0.003672340800268085}, "score": 4.657139753942172}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3158921566712682, "5": 0.27938067517363757, "3": 0.2745717686303338, "2": 0.07495559555865715, "1": 0.055124445732770394}, "score": 3.689500979570047}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7886436640497223, "4": 0.18505540726775252, "3": 0.023348475174939827, "2": 0.0016233148770404173, "1": 0.001281419668051175}, "score": 4.7582404825656965}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4106194359635241, "5": 0.40594008668957465, "3": 0.15323050847805783, "2": 0.018574542844752878, "1": 0.011551182110754333}, "score": 4.180922187782857}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9524122140077628, "4": 0.04411016606852049, "3": 0.0030941563339654224, "1": 0.0001987640728786346, "2": 0.00013450515937401362}, "score": 4.948500364502797}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8844513143755949, "4": 0.10533368662859707, "3": 0.00905405459549823, "1": 0.0005770590251890476, "2": 0.0005405502260718381}, "score": 4.8726227974913785}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2770678380696691, "3": 0.25783627204085274, "1": 0.16297207693456964, "2": 0.15811047206342047, "5": 0.14366880409008012}, "score": 3.0803785136732724}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.24487338449576018, "3": 0.23517103995070684, "1": 0.20574480270232873, "2": 0.1618795077195361, "5": 0.15200242565600525}, "score": 2.97550106646712}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3596257397890975, "2": 0.20877156817282358, "4": 0.2061791763772646, "1": 0.14704500244099672, "5": 0.07827023411886525}, "score": 2.859842895474908}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5257148886429261, "4": 0.38483256322707116, "3": 0.07694331477416808, "2": 0.00808144650157169, "1": 0.004361726123864443}, "score": 4.419551218353945}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5437080222603968, "4": 0.3620667832700751, "3": 0.07682309253311172, "2": 0.009658286765061565, "1": 0.0075961632096531746}, "score": 4.424842595410829}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.31831121858382544, "3": 0.2905778942728602, "5": 0.15127894930836785, "2": 0.1307338502393132, "1": 0.1089779184830453}, "score": 3.272212141486636}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.534215613989397, "4": 0.36334575679422376, "3": 0.08292384686532522, "2": 0.012789560842315462, "1": 0.006651329629598805}, "score": 4.405788641035864}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8245035758498118, "4": 0.12716729193725987, "3": 0.04215770970962997, "2": 0.0036437022958470885, "1": 0.0024452766822090515}, "score": 4.7677859304806}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6178588967530766, "4": 0.30101072007510415, "3": 0.07056301066775894, "2": 0.007217268657045904, "1": 0.0032512231486919742}, "score": 4.523159409692914}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7627302110018919, "4": 0.19703758138231223, "3": 0.034966902771068675, "2": 0.003417948369068869, "1": 0.0017525833141751376}, "score": 4.715737494255283}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8559579995418081, "4": 0.11084013954624675, "3": 0.029195622363649063, "2": 0.002238625091509106, "1": 0.0015985616864490238}, "score": 4.817627663339759}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9620737019475349, "4": 0.032599315101063564, "3": 0.004753728602096939, "2": 0.0002629180950381561, "1": 0.00023320200634201755}, "score": 4.956168284457847}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6207289287467774, "4": 0.25017415090889616, "3": 0.10191949928440226, "2": 0.016636087457369976, "1": 0.01044504683520934}, "score": 4.454245851906668}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5130424647226908, "4": 0.3141476125109111, "3": 0.11588166938868945, "2": 0.032634844882785535, "1": 0.024134256891645004}, "score": 4.259529639451712}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6176656545372078, "4": 0.2850336031141867, "3": 0.07423019283885503, "2": 0.012811757179478776, "1": 0.009979522854221051}, "score": 4.488009664980178}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3146979150916422, "3": 0.23731412345801992, "4": 0.18617976379242826, "1": 0.13450652071002325, "2": 0.12721928855358802}, "score": 3.4193778158669317}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5134418646226617, "4": 0.34150778627895945, "3": 0.11891720313583845, "2": 0.016779825118796148, "1": 0.009196374028064934}, "score": 4.33342821966237}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8014874862241118, "4": 0.14230556032265582, "3": 0.046842357996783324, "2": 0.005106934280056897, "1": 0.004174173100734681}, "score": 4.7319698511193184}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7689981616896204, "4": 0.19595888738377568, "3": 0.02945142449810016, "2": 0.0030264256780399394, "1": 0.0022952885810448545}, "score": 4.726804120688852}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7375512290957051, "4": 0.1993013655611215, "3": 0.048802067510600025, "2": 0.007344033970954603, "1": 0.006897450006224043}, "score": 4.653436605535264}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"2": 0.31066019025519354, "3": 0.29957610106403965, "1": 0.2387522680453575, "4": 0.12349104940425247, "5": 0.027458725299104796}, "score": 2.3902061701516764}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3341076942844482, "4": 0.21981139407068775, "2": 0.1939173968550145, "1": 0.1721053138011285, "5": 0.07998161365784406}, "score": 2.8416344681357164}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.40158577180686406, "2": 0.26686146844598596, "4": 0.15253236133067694, "1": 0.14613183284637274, "5": 0.03282225130998025}, "score": 2.6590291185801815}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.39591608371275083, "5": 0.3700592318778267, "3": 0.18240184249406946, "2": 0.03073935879708315, "1": 0.020813380621343146}, "score": 4.063742998468916}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31827977098896615, "2": 0.2313753257967004, "1": 0.22015289428272458, "4": 0.1741695550377481, "5": 0.05587121325877724}, "score": 2.6141725143991983}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4190549592502627, "2": 0.25526475947621835, "3": 0.18827393041176937, "4": 0.09837355116772858, "5": 0.038789437453278}, "score": 2.0823544278148858}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5838533153785254, "4": 0.23696277919280695, "3": 0.12320390893716165, "2": 0.029560253711675935, "1": 0.026300861070793966}, "score": 4.322664674733608}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5884401245139913, "4": 0.30372973579041906, "3": 0.08764466820362003, "2": 0.011611159702708318, "1": 0.00843220647845618}, "score": 4.452340797499205}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4965784013036592, "4": 0.3585504154354721, "3": 0.10807688575535551, "2": 0.021802158507132897, "1": 0.014781479011965854}, "score": 4.3006160892794245}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.713336921148192, "4": 0.23832301967106734, "3": 0.04204228842448349, "2": 0.003925705102236047, "1": 0.00228315778685729}, "score": 4.656652130699073}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3337601358969966, "2": 0.2563922963048269, "4": 0.19371861712446978, "1": 0.14979925218513948, "5": 0.06609588422157092}, "score": 2.7698657762276637}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6480847786095102, "4": 0.2621852667804463, "3": 0.0731765474044874, "2": 0.008572233173321855, "1": 0.007897700008994878}, "score": 4.53411524958015}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.32515694679567503, "3": 0.3230471148462145, "5": 0.21553219151811573, "2": 0.09052543663304038, "1": 0.04564806776500811}, "score": 3.5744515975837956}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7587023039008305, "4": 0.1788696769569546, "3": 0.05091926193486508, "1": 0.00588625268652343, "2": 0.005579011883945142}, "score": 4.678995791455906}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5498515974403931, "4": 0.2946440680769908, "3": 0.11928811233279081, "2": 0.022227064744667114, "1": 0.013879765761756807}, "score": 4.344507744601345}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"5": 0.2824642175381275, "3": 0.2514767346709102, "4": 0.1686004945743902, "2": 0.1550710468975536, "1": 0.14229060479419267}, "score": 3.293905153022188}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5100493975566391, "5": 0.3471805560237044, "3": 0.11675763364861852, "2": 0.01732745051571331, "1": 0.008590103449872431}, "score": 4.170013838303653}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3970141724760589, "5": 0.3335704138268216, "3": 0.23574456778580163, "2": 0.025815324255229716, "1": 0.007731441132960321}, "score": 4.023003728446339}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7269866389159241, "4": 0.22910407561589918, "3": 0.03822817002239767, "2": 0.003282524788835487, "1": 0.0021766212278353674}, "score": 4.675813565583685}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7549381376330438, "4": 0.21516556014556898, "3": 0.02748278693284844, "2": 0.0014882624208833076, "1": 0.0008160341119611222}, "score": 4.722109591433597}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5002022511744827, "2": 0.36019627059505605, "3": 0.11677344370253105, "4": 0.01816102072617635, "5": 0.0045830140856665995}, "score": 1.6666142719308956}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.2761136286450609, "3": 0.2745188088443006, "2": 0.2518405575121974, "4": 0.13831320002496725, "5": 0.05902110424309248}, "score": 2.452182028785664}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.42600780980722586, "5": 0.2952953018829595, "3": 0.23959123385307157, "2": 0.029571953018624867, "1": 0.009346727471453566}, "score": 3.968514092533264}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5663290552552106, "4": 0.26204867762932116, "3": 0.11163151236851675, "1": 0.03229775357286071, "2": 0.02758376786784833}, "score": 4.302669808056249}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3445236984631238, "4": 0.2824907986716205, "3": 0.26105506941195317, "2": 0.06988845555241777, "1": 0.041704610197221166}, "score": 3.8185166607372514}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7198004774702798, "2": 0.1848621623469648, "3": 0.06563938382447469, "4": 0.02040947551383254, "5": 0.008986718624184044}, "score": 1.4134410001771296}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7146186179970446, "4": 0.22783322203364276, "3": 0.05073031084413384, "2": 0.0041205843217892914, "1": 0.0025969619446238883}, "score": 4.647921241028191}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.48544052564538154, "4": 0.3614492263300541, "3": 0.12649569538128388, "2": 0.018120072088158932, "1": 0.008329602858419575}, "score": 4.297764972315314}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.790341530385061, "4": 0.16975017187931757, "3": 0.0327271752109568, "2": 0.003968409080457737, "1": 0.003117462217407387}, "score": 4.740395673957229}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.843385095288307, "4": 0.12298869972311778, "3": 0.02823864073863775, "2": 0.003076432292467705, "1": 0.002242188233514121}, "score": 4.802322340354149}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4436664223195956, "2": 0.2674394482371606, "4": 0.17618536992499526, "1": 0.08596996396102113, "5": 0.026640229992369834}, "score": 2.7900657614637283}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.47644863887383815, "4": 0.41831823850096694, "3": 0.09343238120388636, "2": 0.008957784035946314, "1": 0.0027999268139992208}, "score": 4.356716258860494}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.39275257717363166, "4": 0.2790397874445761, "2": 0.18244427409723776, "5": 0.07863355203154349, "1": 0.06705798406882998}, "score": 3.1197552507157047}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6372952053946573, "4": 0.2953269887688226, "3": 0.05684435841690432, "2": 0.006663709283461087, "1": 0.003769828761147835}, "score": 4.55586947869959}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5527799373331267, "4": 0.34906773238787075, "3": 0.08374046211134908, "2": 0.00942640014672327, "1": 0.004926593516704469}, "score": 4.4354325302525615}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.29448691739034477, "4": 0.24463139782633167, "2": 0.23253526221823367, "1": 0.1507598960635594, "5": 0.07747719066048314}, "score": 2.8655160208829815}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3176701495818368, "4": 0.29291614660101856, "2": 0.15831265059012634, "5": 0.12134431449852905, "1": 0.10963988022357903}, "score": 3.158030831807527}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3645223910236387, "4": 0.2845956437540291, "5": 0.20567113867881165, "2": 0.09664502973993465, "1": 0.048406256842949774}, "score": 3.5025605561771687}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.603128622915741, "4": 0.310695048284039, "3": 0.07558736797768813, "2": 0.007292980272316124, "1": 0.0032387040945676933}, "score": 4.503268007517428}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3671885876879333, "3": 0.31227211744342626, "5": 0.1398582457059617, "2": 0.1207586685249093, "1": 0.05985175045724024}, "score": 3.4064716188242845}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3247332509412895, "4": 0.31392687574110323, "2": 0.15896088711667936, "5": 0.12294914062183944, "1": 0.07920589112789997}, "score": 3.242506798089178}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.34943448094127777, "4": 0.28298066647933623, "2": 0.168970641176397, "5": 0.0999244378619773, "1": 0.09853243457314058}, "score": 3.116812411024798}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4251120065313067, "4": 0.2531888312682431, "3": 0.21044290453807837, "2": 0.061935101014579316, "1": 0.049198000330444705}, "score": 3.9431979034357054}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3295095638893355, "3": 0.29973476861307957, "5": 0.1684293339906682, "2": 0.12870081909831976, "1": 0.07351104587803246}, "score": 3.390690042731385}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2888669435005625, "4": 0.2764907257979986, "2": 0.16991234373507483, "5": 0.15686322996851249, "1": 0.10779992675070539}, "score": 3.2047186698978427}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"1": 0.44394381826295143, "2": 0.28810113422071826, "3": 0.1876691888317627, "4": 0.06250430778843584, "5": 0.0177078594718572}, "score": 1.921851805709513}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6626092692533221, "4": 0.2984598085316486, "3": 0.036250746673642524, "2": 0.001894343762302139, "1": 0.0007487528516457233}, "score": 4.620346578285902}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7198489864589485, "4": 0.24799380821595043, "3": 0.03028004694653867, "2": 0.001185484532240832, "1": 0.000669195441995017}, "score": 4.685205786454659}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8869321352748696, "4": 0.10254890215313382, "3": 0.009568031400063827, "2": 0.0005012863817161914, "1": 0.0004182401788095235}, "score": 4.875134293827372}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8934718948479364, "4": 0.09466071511205311, "3": 0.010885177256001133, "2": 0.0004965084775512212, "1": 0.0004489594437614324}, "score": 4.880279168042713}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"1": 0.83291456924824, "2": 0.10252799456358601, "3": 0.04088336591514499, "4": 0.013427754268026944, "5": 0.009955809787227998}, "score": 1.264478060868016}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.30480309531142474, "5": 0.2514794757822571, "3": 0.24302691025084047, "2": 0.11613790009608461, "1": 0.08446512936732195}, "score": 3.522739622112413}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4608853663142568, "4": 0.3366780993251433, "3": 0.1547974176210837, "2": 0.032129399362715125, "1": 0.01538797990470218}, "score": 4.195689032941824}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5494606820102977, "4": 0.3282832421817174, "3": 0.1046476171560606, "2": 0.012141347534060806, "1": 0.005375260183002232}, "score": 4.4044417375888045}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.48911690429086796, "4": 0.3368740693230818, "3": 0.13044181678893144, "2": 0.028650983738171414, "1": 0.014764531422239473}, "score": 4.257118529209331}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.295141138931766, "4": 0.24220388682364127, "2": 0.2223431432820789, "1": 0.15946895742399125, "5": 0.08077317186204942}, "score": 2.862459585620213}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6716116078861232, "4": 0.25738812996899885, "3": 0.05342187354171679, "1": 0.00969328404271256, "2": 0.007836413586373388}, "score": 4.57346497761188}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.36156530631227246, "4": 0.3113999749579103, "5": 0.16230144520055068, "2": 0.11444693651018961, "1": 0.05024346451019646}, "score": 3.421087052886843}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5978430187170649, "4": 0.253245526594369, "3": 0.09604270909890573, "1": 0.027624657980976335, "2": 0.02519690775824887}, "score": 4.368549908288283}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6445160847312751, "4": 0.29998632160962085, "3": 0.04798595572256601, "2": 0.00439559797095417, "1": 0.0030792457449187877}, "score": 4.578522482115911}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6288071292912732, "4": 0.23513214587732756, "3": 0.10295642896581138, "1": 0.02029425374001001, "2": 0.012714095742729626}, "score": 4.439581923915537}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5030748564373594, "4": 0.3081923123847047, "3": 0.14915889975090138, "2": 0.022908446354141125, "1": 0.01662302161704224}, "score": 4.258240964930862}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4642637321374614, "4": 0.298557510415022, "3": 0.1803642070234853, "2": 0.03085673617358136, "1": 0.02587280142729767}, "score": 4.14457993963376}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9523915602204397, "4": 0.03948543536529709, "3": 0.006757803282146456, "1": 0.000861900864754116, "2": 0.000449638783892116}, "score": 4.942199336590372}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5285192766871135, "4": 0.3053670143662325, "3": 0.1203171627411358, "2": 0.023187081205405347, "1": 0.022547668744417087}, "score": 4.294203125953514}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6180975846658009, "2": 0.25145805064364435, "3": 0.10130565955888755, "4": 0.015632951762685605, "5": 0.013476651626682271}, "score": 1.5548909798505048}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4374340619876429, "3": 0.26238423598330285, "5": 0.2023290998744841, "2": 0.06760313643784399, "1": 0.030033747887374215}, "score": 3.7145757762593807}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6656942619406865, "4": 0.26558344337855416, "3": 0.058083241446131056, "2": 0.006451362049517313, "1": 0.004091461654628746}, "score": 4.582489964167396}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6761254319023959, "4": 0.2470955932548243, "3": 0.061944924700597925, "2": 0.007954627056007834, "1": 0.006782639133774081}, "score": 4.577979274807081}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6400970586411162, "4": 0.2555797972744282, "3": 0.07884760028195534, "2": 0.013690323631068816, "1": 0.011735932379022944}, "score": 4.498685593071943}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5556410259640635, "4": 0.34824288404441667, "3": 0.07764881424598839, "2": 0.011241601077988177, "1": 0.0071367299338443374}, "score": 4.4341374339990205}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7757578162276938, "4": 0.18341709719078278, "3": 0.03393367143093209, "2": 0.003645079875661099, "1": 0.0031605822880133166}, "score": 4.725114418908678}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.2728388093822104, "4": 0.23600884401944952, "2": 0.21136658147413576, "1": 0.1947660858908334, "5": 0.08489101683822654}, "score": 2.804867018163285}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6629845448520698, "4": 0.2573487268626854, "3": 0.06420338139302073, "2": 0.00883637547987447, "1": 0.006558712241144579}, "score": 4.561470601293768}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3493244613467237, "4": 0.24193673805394794, "2": 0.24168216108895327, "1": 0.11964227859186552, "5": 0.047327895521366285}, "score": 2.8556133263729184}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3952555900178121, "4": 0.29478417516777133, "3": 0.2076848484430588, "2": 0.054623275273792425, "1": 0.047547403364961355}, "score": 3.935675245633105}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7671037649489928, "4": 0.16035267030560477, "3": 0.051968609819107815, "1": 0.012527989222588303, "2": 0.008011293862882171}, "score": 4.661552198521078}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.33462961020777243, "4": 0.2108708116668067, "2": 0.1898077046710136, "1": 0.15218090520490585, "5": 0.11244107188931067}, "score": 2.941579356974295}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.38686371716533474, "4": 0.2350070653431335, "3": 0.1827268617242846, "1": 0.1130211849960975, "2": 0.08228639457263182}, "score": 3.70047212319398}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5234439616290986, "4": 0.20874964830897846, "3": 0.12758005870828876, "1": 0.09977363589024832, "2": 0.04036420102855306}, "score": 4.015815992820305}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5105555920748651, "2": 0.21018442907410798, "3": 0.16041217218320394, "4": 0.08331745566179492, "5": 0.03536338203500926}, "score": 1.9225687089139596}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.27718054447670637, "4": 0.26849327819555935, "3": 0.25734803202206086, "1": 0.10852164856061318, "2": 0.08839051601430752}, "score": 3.5174546960524147}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.35277179647828627, "4": 0.26991880160765486, "3": 0.19998380314270092, "1": 0.11126401370290635, "2": 0.06598690273878112}, "score": 3.686998771088339}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8051514843099922, "4": 0.16246888052714528, "3": 0.02875150975212936, "2": 0.0019921317150353433, "1": 0.001590354232225903}, "score": 4.7676796849200525}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.2947603280926275, "3": 0.21695248772302378, "4": 0.210979417005779, "2": 0.16149562927473152, "5": 0.11569122388419727}, "score": 2.691308254154367}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6206465014183355, "2": 0.23499641976419763, "3": 0.10480084962702044, "4": 0.027836649477115782, "5": 0.011677266050497528}, "score": 1.5748414552990984}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.958829999808246, "4": 0.03774144694317204, "3": 0.0031652317605017225, "2": 0.00013517720643846696, "1": 0.00010892826626974747}, "score": 4.955085981782966}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8633694326072894, "4": 0.12337670027078103, "3": 0.012560692300431497, "2": 0.00038768139599789736, "1": 0.0002686231741625098}, "score": 4.849258820378533}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9034464050208639, "4": 0.08801726416959915, "3": 0.0074427594878393, "1": 0.0005047270852594871, "2": 0.0004813696884553362}, "score": 4.893622766603243}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.949110673492161, "4": 0.04619148524206371, "3": 0.004008968510718634, "1": 0.00030704353887282164, "2": 0.00029491629135796417}, "score": 4.943672759141684}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.27260007079960075, "4": 0.22874500754604413, "1": 0.18361432150463625, "2": 0.1710187977771208, "5": 0.14372414160108907}, "score": 2.9779392833518914}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.32813453073780663, "5": 0.270366941514516, "3": 0.24862279764176867, "1": 0.08247959084028758, "2": 0.07012178941014052}, "score": 3.6339613698863324}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6437460905208192, "4": 0.24493289595854256, "3": 0.08511637850949653, "1": 0.013859085065354408, "2": 0.012178526512546185}, "score": 4.492777709214986}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7404578114174599, "4": 0.18065582088760834, "3": 0.05665633900856909, "1": 0.0127366119779757, "2": 0.009381130507863107}, "score": 4.626899767652255}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7548688148468695, "4": 0.17181734742417956, "3": 0.049448576894646344, "1": 0.015571499356318803, "2": 0.008104423137384095}, "score": 4.642618565941414}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6476146600028282, "2": 0.25091127208868974, "3": 0.07694791612197048, "4": 0.01830024740183846, "5": 0.00610236608636124}, "score": 1.4841771253017324}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2941988440359852, "4": 0.2652709294453751, "2": 0.15554933979096838, "5": 0.1479304867020381, "1": 0.13664383266116892}, "score": 3.132348706400897}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3430097179506186, "5": 0.2664055785585647, "3": 0.262041314164937, "2": 0.07555908092010717, "1": 0.05256544049414568}, "score": 3.6954222032053057}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6398011973655275, "4": 0.24987777016997825, "3": 0.08449302435824858, "2": 0.014611004519068885, "1": 0.011019586485094773}, "score": 4.493124755774107}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4554231236825791, "5": 0.29362181007622623, "3": 0.18708968091543515, "2": 0.04068757563867594, "1": 0.022936471348842087}, "score": 3.956337026287394}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3666144969617858, "2": 0.3212572419473588, "3": 0.23121644865801083, "4": 0.06132483373819023, "5": 0.019459933879396783}, "score": 2.045637218782825}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8835184717240736, "4": 0.09247504080586222, "3": 0.02042238246370936, "2": 0.0018859707573645713, "1": 0.0015577320961654847}, "score": 4.854770963140536}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3019034544408782, "4": 0.21349725575556008, "2": 0.17773530251328312, "5": 0.16681344279645333, "1": 0.1399262893035345}, "score": 3.0895473869557204}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8562053215318169, "4": 0.12762308595807184, "3": 0.014043733456902473, "1": 0.0010416541505563208, "2": 0.0010067502599758148}, "score": 4.837089635761192}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6147677160505854, "4": 0.286935335630766, "3": 0.07510553659200166, "2": 0.012937819663136944, "1": 0.01018793603856065}, "score": 4.483254460583549}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"5": 0.366181817428236, "4": 0.3501990751686822, "3": 0.1772767159934456, "1": 0.05677376180698841, "2": 0.049284709409830124}, "score": 3.9199916812168696}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.34984971584852786, "4": 0.30566162180033124, "3": 0.2089841222497688, "2": 0.07877683479658124, "1": 0.05644926549919453}, "score": 3.8139123132887014}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8717183154502596, "4": 0.10739893641311823, "3": 0.017185320824266315, "2": 0.0017808174117556043, "1": 0.001625152697374563}, "score": 4.84634257435005}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9508189244324208, "4": 0.04431771919828005, "3": 0.0039887993825137875, "1": 0.00026071022929305236, "2": 0}, "score": 4.946629079553059}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4083123637792833, "4": 0.37413074765516957, "3": 0.15732747782047718, "2": 0.03683070156386362, "1": 0.023221876314786376}, "score": 4.107676894700657}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3903628218089961, "4": 0.3242350705071866, "3": 0.1709064753289458, "1": 0.061289563707737686, "2": 0.05300933228931347}, "score": 3.929555131711397}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4588029334512894, "4": 0.3890469299871268, "3": 0.13186609540854016, "2": 0.01447853168696631, "1": 0.0057430376575486304}, "score": 4.280768201793514}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5460545498923387, "4": 0.23665469107185566, "3": 0.1631651012009112, "2": 0.0315660311558282, "1": 0.02224423956153629}, "score": 4.253104493591829}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.758844050317634, "4": 0.20187719742238744, "3": 0.03270463395359135, "2": 0.003435523373480204, "1": 0.002945500580271014}, "score": 4.710569074751762}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8580083307864458, "4": 0.1219126224836001, "3": 0.016127856253279386, "1": 0.0021416151320810747, "2": 0.001591671113339983}, "score": 4.832453682089893}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3236071172712358, "1": 0.2972594953306486, "3": 0.27188358517026373, "4": 0.08343032721878778, "5": 0.0237020674611048}, "score": 2.2126159093730817}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.300075400771654, "3": 0.2749809930186569, "5": 0.23454694951124602, "2": 0.09719062721445802, "1": 0.09303937391470812}, "score": 3.4859809161765147}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8177869243425278, "4": 0.12612148120047934, "3": 0.04506917713205255, "1": 0.005669373846821267, "2": 0.0052371071694137655}, "score": 4.745321821191929}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.751559235405945, "4": 0.18747868875589788, "3": 0.045776555846437264, "1": 0.008362981305226417, "2": 0.0066893705330083415}, "score": 4.667403871519011}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6705721605853573, "4": 0.23025607956596908, "3": 0.07349271450920719, "2": 0.013018932953193313, "1": 0.012467712205438198}, "score": 4.533741135444426}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.34715069977972335, "5": 0.3449462055674266, "3": 0.19403094933270085, "1": 0.05874717571791267, "2": 0.05505497211005703}, "score": 3.8645543040018278}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8844962633335348, "4": 0.094455023460105, "3": 0.01755841424161731, "1": 0.001794618525931451, "2": 0.0016560351456925255}, "score": 4.858275949824345}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7174513848145172, "4": 0.15077917948741462, "3": 0.09135177185622793, "1": 0.023265004506094183, "2": 0.017101937804386784}, "score": 4.522127206922734}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.918956928055093, "4": 0.06475712149315926, "3": 0.013072611010860092, "1": 0.0019004790367168297, "2": 0.001287963487391913}, "score": 4.897629301161307}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9048356355080018, "4": 0.07851004504685052, "3": 0.013773263411790408, "1": 0.0015550715835083127, "2": 0.0012924618092335757}, "score": 4.8838418624403355}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"1": 0.750202319122614, "2": 0.164468486262743, "3": 0.061808165216602755, "4": 0.015042266104026921, "5": 0.008443903308276367}, "score": 1.367000021856662}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.3484807803303721, "3": 0.19655714022400042, "5": 0.18585676176209837, "4": 0.1354009096884924, "2": 0.13358043142197185}, "score": 2.6765323387178306}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3488797751286402, "4": 0.23425987568771708, "3": 0.22355109010000287, "2": 0.09917863111926628, "1": 0.09391225407042407}, "score": 3.645157172168779}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4245904592233243, "4": 0.244778416530142, "3": 0.18928616660663963, "1": 0.07363597366761067, "2": 0.06744559541116818}, "score": 3.87947343547311}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6855742642235793, "2": 0.13240342066163696, "3": 0.08828468758001164, "5": 0.053343289057976855, "4": 0.04028190976565964}, "score": 1.6432640026932894}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6835136447223868, "4": 0.2131824515246499, "3": 0.08951957164589722, "2": 0.008858976856355541, "1": 0.004826474475969795}, "score": 4.56185225232187}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7041787632405544, "4": 0.2185358728760034, "3": 0.06901068025905051, "2": 0.0057603704045293535, "1": 0.002436099705412024}, "score": 4.616387252869519}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9329929018887628, "4": 0.0547571678072922, "3": 0.011100471434379715, "2": 0.0005816480606085098, "1": 0.00045045832208063597}, "score": 4.919485663296158}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7732547303071314, "4": 0.18336237369413283, "3": 0.037890960673405555, "2": 0.0035767775844238177, "1": 0.0018176115044219025}, "score": 4.7228278890918185}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7263055245275524, "4": 0.17721646987708695, "3": 0.0737670960336778, "2": 0.012291913153810044, "1": 0.010246660821352789}, "score": 4.597317558794028}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9167963126576749, "2": 0.06741628318231746, "3": 0.01180590321674063, "5": 0.002056474849762981, "4": 0.0018674593654298467}, "score": 1.104862403696619}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6165535369513193, "2": 0.1981761692872605, "3": 0.11951112687745377, "4": 0.04296295698621615, "5": 0.022679648465504618}, "score": 1.6568824550226093}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.28488320207278933, "3": 0.2812781054408126, "2": 0.2487792554524094, "4": 0.13703485081411904, "5": 0.04793212170726111}, "score": 2.414299278098868}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3140122440639148, "4": 0.2484448722769204, "2": 0.18271578881197673, "1": 0.171817897240571, "5": 0.0828938587335946}, "score": 2.8878680732809334}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.2736148823934988, "3": 0.26777818743354787, "2": 0.19050239734621474, "4": 0.1778779389767956, "5": 0.09011920365075708}, "score": 2.6203434127485705}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.30915920754462584, "3": 0.26520260445458665, "5": 0.17639903604886012, "2": 0.1479028262873542, "1": 0.10125109077166866}, "score": 3.3115788291997923}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3522760773998488, "4": 0.33277150356776747, "5": 0.2054577011607839, "2": 0.07200531811395332, "1": 0.03736591327154051}, "score": 3.597023485564657}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.48371072333826587, "5": 0.2392802068960406, "3": 0.22052861925012118, "2": 0.03826559842030972, "1": 0.01809128406608124}, "score": 3.887932690670506}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.562474403965633, "4": 0.3382662065989834, "3": 0.08073529812653135, "2": 0.012215573804214685, "1": 0.006182303761715462}, "score": 4.4388164316098155}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3808369302761716, "5": 0.34492416420911975, "3": 0.18418002554372634, "2": 0.05019188594050684, "1": 0.0397358848125397}, "score": 3.941144995913203}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3435991715374306, "4": 0.23643730531481563, "2": 0.2092178971542656, "1": 0.14076236007637233, "5": 0.06988407368362766}, "score": 2.8854514730508294}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.45974945542539314, "5": 0.2762560019141847, "3": 0.21333326747660306, "2": 0.03847361104899178, "1": 0.011977749005315107}, "score": 3.95003177623749}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.3736156813027056, "4": 0.36964980296885025, "3": 0.20634119374429935, "2": 0.03388991505018454, "1": 0.016317165942664875}, "score": 4.050552574591648}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5011875483219398, "4": 0.3697668526244529, "3": 0.1041373060629471, "2": 0.01511879964409876, "1": 0.009638656955832449}, "score": 4.337947646906612}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3005527498938932, "3": 0.2938408749013004, "5": 0.14513919957428684, "2": 0.1444710843151083, "1": 0.11584114106955357}, "score": 3.214711052118566}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"1": 0.35250573054383916, "2": 0.20326890933970418, "3": 0.19900721472805283, "4": 0.14863048792653566, "5": 0.09653822838656048}, "score": 2.433398567687407}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.26295988156972516, "3": 0.2545036757678964, "4": 0.18078950143397365, "1": 0.17022615542536237, "2": 0.13146706697299101}, "score": 3.2348025000653053}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8816286353474461, "4": 0.08842518957372886, "3": 0.027007023963873285, "2": 0.0016976318983811791, "1": 0.0012115431516213468}, "score": 4.847617126357978}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9601337800599876, "4": 0.0338511942363334, "3": 0.005098380187473522, "1": 0.000521469380256428, "2": 0.0003518928964904642}, "score": 4.952808446574914}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.783931190267082, "4": 0.14946614001465627, "3": 0.049047404978864055, "1": 0.010091260769943258, "2": 0.007444475986081838}, "score": 4.689734520130464}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3247902791070812, "2": 0.2723514366915601, "3": 0.26958023902914735, "4": 0.09461748397213404, "5": 0.038606655310617834}, "score": 2.2498583626354645}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3385929264771441, "4": 0.23002819284132042, "3": 0.21582210469694887, "1": 0.13091195250973645, "2": 0.08458164483799213}, "score": 3.560843929293087}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3215959291091934, "2": 0.2093191621937988, "4": 0.20881591596347215, "1": 0.16960755680223488, "5": 0.09060429145518183}, "score": 2.841481164599763}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6036724677904521, "4": 0.259613498032818, "3": 0.09430380879193577, "1": 0.022905599011225335, "2": 0.01944343885034784}, "score": 4.401789568772713}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.2636429904321239, "3": 0.25550083531732104, "2": 0.1845917590701626, "4": 0.1836915843007829, "5": 0.11245409331936167}, "score": 2.6966860162426753}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.41319650506036587, "5": 0.3957780122638123, "3": 0.1470476051605739, "2": 0.025896649022960773, "1": 0.01796616521924194}, "score": 4.143055073784606}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5515791129930114, "4": 0.30780094112374967, "3": 0.1167460752150392, "2": 0.015178652182321693, "1": 0.008634031789141506}, "score": 4.378596803133684}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3206687885200627, "4": 0.3186142039844869, "5": 0.24883227596088078, "2": 0.07344897731592707, "1": 0.038357346690937384}, "score": 3.6661673177408693}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5842249686740123, "4": 0.32437663000857647, "3": 0.07546813989008756, "2": 0.009279941834850064, "1": 0.006493348069553556}, "score": 4.470790801654676}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.47240070607740614, "5": 0.35355136503510387, "3": 0.13626252814197817, "2": 0.02113830038146338, "1": 0.016502143457459924}, "score": 4.125524001328755}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4218400775172929, "2": 0.25449759320273246, "3": 0.1841817936804586, "4": 0.09498658574840473, "5": 0.04442337873660691}, "score": 2.0855910641265827}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4394031281136316, "5": 0.25512856102187625, "3": 0.23313301697650374, "2": 0.04993361778272877, "1": 0.02229177728786742}, "score": 3.855237067341211}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.40208643541703054, "5": 0.2858799818838876, "3": 0.23369633968776782, "2": 0.050560719430615554, "1": 0.027615247863106814}, "score": 3.868195202832323}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3515158065129821, "5": 0.30789498867629517, "3": 0.21510037485691483, "2": 0.07169071770059576, "1": 0.05367522732576955}, "score": 3.7883614892578437}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3570240973145333, "4": 0.29112513123266764, "3": 0.21173764378455603, "2": 0.08153270914890558, "1": 0.058475875173332144}, "score": 3.8067732091369146}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3282256335280217, "4": 0.23248285467668145, "2": 0.16673402514583702, "5": 0.14267747722466287, "1": 0.12978721204761542}, "score": 3.0915378543577368}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.2690569800672586, "2": 0.2553821316620795, "3": 0.23771973101609192, "4": 0.16902183013578587, "5": 0.06871969772242256}, "score": 2.5129166059595085}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5431139436965344, "4": 0.19218761934488066, "3": 0.16697805205879704, "1": 0.053394742121921704, "2": 0.04422351578686336}, "score": 4.127517656692824}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4645612347641862, "4": 0.36398027586414133, "3": 0.12205445272679566, "2": 0.024655243082388912, "1": 0.0245829786581372}, "score": 4.219483753575806}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7688956764443989, "4": 0.1459357387082959, "3": 0.06310589441063909, "2": 0.012466546528843218, "1": 0.009489241460076087}, "score": 4.652458714029427}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.397078374858371, "4": 0.23317267627561922, "2": 0.19225714617996784, "1": 0.09241575557403481, "5": 0.08494111731634885}, "score": 3.025969757674376}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3162363506094669, "4": 0.31223570863720707, "2": 0.14677772666918193, "1": 0.11523485681134615, "5": 0.10935738485817481}, "score": 3.153727322738049}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.41213111086593307, "2": 0.23516316185282737, "4": 0.19329648057406537, "1": 0.1099596498532902, "5": 0.049280471107070505}, "score": 2.836747351002618}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.39170336797264405, "5": 0.35526226060131805, "3": 0.18919801764172198, "2": 0.040433226253888246, "1": 0.023279421641632356}, "score": 4.015361425825758}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3363509399349275, "3": 0.2670878362401457, "5": 0.1647314346436465, "2": 0.11780530203399131, "1": 0.1139619452400048}, "score": 3.3201046366627267}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4632021319863629, "4": 0.3971813903493408, "3": 0.10958975336873172, "2": 0.018952565007827375, "1": 0.01075206983663164}, "score": 4.283542365096821}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8253444208085075, "4": 0.14694081387205737, "3": 0.023438104115242785, "2": 0.002302771227068236, "1": 0.0016277786256146494}, "score": 4.792691797991817}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.29464781008041707, "4": 0.25406285041340604, "5": 0.2445415367592591, "2": 0.11166604533554038, "1": 0.09467307860876553}, "score": 3.442314485933342}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8314426786562016, "4": 0.14530302349283417, "3": 0.02084352355194202, "2": 0.0013484539028338956, "1": 0.0007344798473227986}, "score": 4.8059630351204214}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5674067047826447, "4": 0.2939520853280488, "3": 0.11128809384084865, "2": 0.0183575379750707, "1": 0.008970211720614147}, "score": 4.392502856195726}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3247219504207869, "3": 0.23032120519360003, "5": 0.21321675534076817, "1": 0.13274531651129667, "2": 0.09879085887665875}, "score": 3.386952874178689}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3767669697580754, "3": 0.26014294775319047, "5": 0.19615021700607782, "2": 0.09148996361358278, "1": 0.07535828548259306}, "score": 3.5269091427031207}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8924577324939416, "4": 0.094700357852099, "3": 0.01185754861836983, "1": 0.0004748232160221877, "2": 0.00044333582727503385}, "score": 4.878347190906916}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9347572958689858, "4": 0.05732819023867098, "3": 0.0068672152793169, "1": 0.0005407383702857054, "2": 0.0004336444063126583}, "score": 4.925468057943719}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8085859480897413, "4": 0.17090580879499176, "3": 0.018670164696796634, "2": 0.0009130593262655875, "1": 0.0008236949523959275}, "score": 4.785698190076485}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"1": 0.2431444178585563, "4": 0.22108801474120932, "3": 0.21810379623246823, "5": 0.162904767073397, "2": 0.1546909072182952}, "score": 2.9059113988127803}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9328466014136088, "4": 0.05678409557198138, "3": 0.008866829388008113, "1": 0.0008614401295502658, "2": 0.0005985341352037053}, "score": 4.9202374928725545}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7370618861244472, "4": 0.17234613699371273, "3": 0.06859038598931559, "1": 0.01274757272514065, "2": 0.009194052236761334}, "score": 4.611877369282063}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.48006207045142213, "4": 0.3170354759031698, "3": 0.14241611774469287, "1": 0.03124327893535846, "2": 0.02918404859403332}, "score": 4.185558968245088}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7531152563600655, "4": 0.18271926044494458, "3": 0.04930483153485754, "1": 0.008740398459693098, "2": 0.006072060349232745}, "score": 4.66547717999038}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4134978351340218, "5": 0.27448026910909157, "3": 0.2534966426557854, "2": 0.04516935991472199, "1": 0.013327077648453063}, "score": 3.8906605230026567}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7789474762245492, "4": 0.16131279060526355, "3": 0.05098054447104935, "2": 0.005465844721214874, "1": 0.00323617662500718}, "score": 4.707367150743595}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.30794665779031244, "5": 0.2699342414046808, "4": 0.24660532372038152, "2": 0.11815067054441314, "1": 0.0573083351926648}, "score": 3.5537367945104226}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9222097008660529, "4": 0.07010152714103991, "3": 0.007120174823481017, "2": 0.0003043199326257653, "1": 0.00023907266848710023}, "score": 4.913786699771157}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8561497470480858, "4": 0.12746470197089993, "3": 0.01475116819015304, "2": 0.0008769762911447426, "1": 0.0007252704051687903}, "score": 4.837495728902065}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.659562765507484, "4": 0.24514460942769914, "3": 0.07634381187847611, "2": 0.010318481203116209, "1": 0.008530175015887459}, "score": 4.537045254999176}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6373655539218926, "4": 0.24889615940520923, "3": 0.08065740194589004, "1": 0.018211081437378512, "2": 0.014812705303958293}, "score": 4.4724764745109225}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5694059070649313, "4": 0.2838791385178689, "3": 0.10168947214679176, "2": 0.023532194892358697, "1": 0.021395595412165125}, "score": 4.356500086091176}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3302993217578517, "4": 0.21699147758820211, "5": 0.1899656713976792, "1": 0.13321085902327554, "2": 0.12940775089296958}, "score": 3.2011184750312065}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6719945826662757, "4": 0.25670656932072206, "3": 0.05168490567298097, "1": 0.012771215876014505, "2": 0.006811043091446365}, "score": 4.568391951756326}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3844727745329391, "2": 0.25099757531415007, "3": 0.20089284952594838, "4": 0.10297186329128717, "5": 0.06052353386972157}, "score": 2.203963244294419}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.712336476390787, "4": 0.1980737188809575, "3": 0.06183090244088866, "1": 0.014816082985808693, "2": 0.012794037972062274}, "score": 4.580555624886064}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5649032338645614, "4": 0.2551794897651757, "3": 0.11350768898431801, "1": 0.03477625683198978, "2": 0.031469784994730673}, "score": 4.284173679738182}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.42614270523262987, "4": 0.2937095867528288, "3": 0.16444784676287275, "1": 0.058211002250857485, "2": 0.05734821847324887}, "score": 3.9723615276813593}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.35791605618726247, "4": 0.27009503511701344, "3": 0.20190251441028617, "2": 0.08585644685922789, "1": 0.08406023952133952}, "score": 3.732074460412517}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6593516996274302, "4": 0.24165221852417454, "3": 0.06985117302039917, "1": 0.01688712975737183, "2": 0.012169145355039834}, "score": 4.514546452788787}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7986327068160574, "4": 0.17130698466899263, "3": 0.023292957903365937, "1": 0.004147415126012338, "2": 0.0023759795129849365}, "score": 4.758330543774033}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9197004718738053, "4": 0.06047654953969508, "3": 0.016786018016784393, "1": 0.0017283708834572383, "2": 0.0012275843300544793}, "score": 4.895346700424933}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9752755553912058, "4": 0.022588530534461256, "3": 0.0018720999692040513, "1": 0.00011309809709066108, "2": 9.938453896615065e-05}, "score": 4.972915333226134}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7157847612456336, "4": 0.2324420342715367, "3": 0.043055960603674136, "1": 0.004412013137150524, "2": 0.004267982695611025}, "score": 4.6509810436114}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4068026665045247, "2": 0.32220045373501, "3": 0.19958621113121952, "4": 0.05433215251132754, "5": 0.016604728081294116}, "score": 1.951238931482316}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.34314554238262746, "3": 0.2925203915615042, "5": 0.23561993901310818, "2": 0.07857477969946391, "1": 0.050013995636112404}, "score": 3.635862355868997}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.43455815488469357, "4": 0.3473691262578106, "3": 0.17294696364709383, "2": 0.029176674716682255, "1": 0.01576033402968568}, "score": 4.156006285349904}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.890005924087513, "4": 0.09738993601567036, "3": 0.011014060446560172, "2": 0.0008135826812681969, "1": 0.000704433235321499}, "score": 4.875314476826722}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6133196972738776, "4": 0.31107090575747515, "3": 0.06386654545509637, "2": 0.007689416316275052, "1": 0.003978715302936607}, "score": 4.522177190301908}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"4": 0.36318130739605275, "5": 0.23888483622024237, "3": 0.2334294240554141, "2": 0.09670873980469394, "1": 0.06754565765918011}, "score": 3.6093032717744307}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.49049151441198147, "4": 0.31659453285125705, "3": 0.13163859868741576, "2": 0.0344868150656949, "1": 0.02663359207417469}, "score": 4.210011049933795}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5732217149630302, "4": 0.28626380448539496, "3": 0.11464672904526925, "2": 0.016199783516695997, "1": 0.00958394956537778}, "score": 4.397456963896042}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5849671600457116, "4": 0.3013726922239876, "3": 0.08490010066300421, "2": 0.01628302703305991, "1": 0.012338850712153283}, "score": 4.430543941144602}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3679109329994376, "5": 0.3302363727063598, "3": 0.19127821265590855, "2": 0.06036287592569035, "1": 0.05005442327515308}, "score": 3.8680483978991673}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"4": 0.36592023737518614, "5": 0.3574396293711212, "3": 0.21847886430386165, "2": 0.04036222323115909, "1": 0.01757818384644537}, "score": 4.005502982464615}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5113524502570649, "4": 0.4021712966713169, "3": 0.07439321035327194, "2": 0.008298224522616433, "1": 0.003597926757892238}, "score": 4.409645569834433}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6417760294142848, "4": 0.28381195227758693, "3": 0.06823893381283337, "2": 0.004542656981037194, "1": 0.0015409074235755488}, "score": 4.559879179803596}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6232685024346669, "4": 0.2874853145141901, "3": 0.07368841378110833, "2": 0.010003502473103621, "1": 0.0054673824796105264}, "score": 4.513215526649191}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.43933465247221803, "3": 0.2762632675425777, "5": 0.19629008272297932, "2": 0.06086933265397087, "1": 0.027080293303391116}, "score": 3.7170013190971942}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7313868299939533, "2": 0.1680183801346227, "3": 0.05184357847997636, "4": 0.02960224724780463, "5": 0.018889795941286276}, "score": 1.436184507757906}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8114187339896901, "4": 0.1550168280331745, "3": 0.028128969236678365, "2": 0.002717779751046407, "1": 0.002565810155838892}, "score": 4.770273763064068}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6279007728587714, "4": 0.23644253063700268, "3": 0.10188158209364939, "2": 0.018077702612221865, "1": 0.015569903359431023}, "score": 4.443210588552645}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8717681268579028, "4": 0.10300695178209548, "3": 0.019880490599797164, "1": 0.002804319140866996, "2": 0.0023456939344163154}, "score": 4.838946396982947}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.67100371869932, "4": 0.2468131515698836, "3": 0.06307558561971867, "2": 0.01029321231011299, "1": 0.008722965662248984}, "score": 4.561224088350535}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.40985645104185664, "3": 0.24615639328231215, "5": 0.17275682658164015, "2": 0.09963046377129423, "1": 0.07150945501877691}, "score": 3.512767089824823}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.34189954949127654, "4": 0.24338038236816467, "2": 0.15762688909919317, "1": 0.1448959036849844, "5": 0.11201556994309456}, "score": 3.019996459250084}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.33311310234063235, "3": 0.24905610166596492, "2": 0.1741546119309943, "4": 0.12444868708039984, "5": 0.11911703282998778}, "score": 2.5222491617868963}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5097717512557347, "4": 0.32374710762018644, "3": 0.11502612528824735, "1": 0.02800994649283157, "2": 0.02335320138459152}, "score": 4.264033639951263}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.467104676382949, "4": 0.38380425844142124, "3": 0.11347007876854559, "2": 0.019869950770514826, "1": 0.01565585986202339}, "score": 4.2669525239005335}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.34184303816653533, "2": 0.2662799446802383, "4": 0.18171255655433452, "1": 0.17614839249676484, "5": 0.03389400919920422}, "score": 2.6308787907491284}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8117528313882737, "4": 0.1607470608520736, "3": 0.023578285416062973, "2": 0.0022137609998571614, "1": 0.0016261532867595922}, "score": 4.778932364948743}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.40601543616187896, "5": 0.25257382418234314, "3": 0.24118881198742537, "2": 0.06844130926685846, "1": 0.03165592323109627}, "score": 3.779507129571863}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9885063692932134, "4": 0.010720858956610015, "3": 0.000633209390398666, "1": 3.623300913722283e-05, "2": 0}, "score": 4.987866536483137}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5891561264982993, "4": 0.27712278606987245, "3": 0.0962857448203401, "2": 0.02017916182207106, "1": 0.017126128486209948}, "score": 4.401185847718697}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5582374329636423, "2": 0.23431226205249817, "3": 0.14148953814545615, "4": 0.049760429458081595, "5": 0.016132826011342936}, "score": 1.7311532919226982}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3028132500363173, "2": 0.27648030229412035, "1": 0.263368865240118, "4": 0.12555684183009164, "5": 0.03171487389812112}, "score": 2.3857280967880534}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6253937672686388, "4": 0.26287493295617753, "3": 0.0845099331040863, "1": 0.013953670319226515, "2": 0.01322246502685293}, "score": 4.472599269444327}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7056951737168098, "4": 0.22861808928992994, "3": 0.05019487746605545, "2": 0.007800249957240367, "1": 0.007626959544974163}, "score": 4.617058810568875}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.2908612295354649, "4": 0.2530098900277187, "2": 0.17187001751244377, "1": 0.16690716822759516, "5": 0.11726487664532884}, "score": 2.981853713925544}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3012750934159565, "3": 0.25964553631519666, "2": 0.2342348814924452, "4": 0.13941258569152018, "5": 0.06533091006169743}, "score": 2.433232097886679}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.2857602518386852, "1": 0.23293375014236398, "2": 0.20372292889651342, "4": 0.18034330402324356, "5": 0.09703569291175623}, "score": 2.7047640112114726}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3329547114175063, "5": 0.3036077520576251, "3": 0.2525277084125454, "2": 0.07020015921029663, "1": 0.04061168686413406}, "score": 3.7888239731746216}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.2942778176035031, "2": 0.2818777817606403, "1": 0.25002296633481313, "4": 0.13387540834805203, "5": 0.03981106461205701}, "score": 2.4314970972278163}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.36921031055365744, "4": 0.23875775941067304, "3": 0.1941834787736551, "1": 0.11431101998633071, "2": 0.08336369301125081}, "score": 3.6653082370324905}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.36909281330400306, "4": 0.24444171083065042, "2": 0.20006691367792476, "1": 0.10825643155082904, "5": 0.07803205306290484}, "score": 2.98392427059959}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4801581933006039, "4": 0.2589858893605897, "3": 0.18746147900220986, "2": 0.04850160930707602, "1": 0.024785997554599835}, "score": 4.121348466856135}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.33283463630994553, "3": 0.30042504211501353, "5": 0.2746086460951272, "2": 0.05968887048497327, "1": 0.03229303198644473}, "score": 3.757890505583468}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7843459211395256, "4": 0.18683083447999996, "3": 0.02596674754707899, "2": 0.0017793906584478501, "1": 0.0010109484796849604}, "score": 4.751837286658593}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5078050321764633, "4": 0.3631154322819446, "3": 0.10500958996449784, "2": 0.016327011426260814, "1": 0.007667275053999716}, "score": 4.347165860452899}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8369866486948448, "2": 0.10146889303846866, "3": 0.036499307177945195, "4": 0.014375412457711291, "5": 0.010583257581401636}, "score": 1.259949255777589}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5339790355832511, "4": 0.15591780525166601, "3": 0.14290857340639257, "1": 0.10871288006676695, "2": 0.058209244305134605}, "score": 3.9484993014145315}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.3934190146724066, "2": 0.18154551234312652, "3": 0.16307566229783868, "4": 0.1439925668263377, "5": 0.11783306023293794}, "score": 2.4111961377662405}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4889132784097719, "4": 0.2840346333047083, "3": 0.13217103175112282, "1": 0.051654281105875575, "2": 0.043015769412264315}, "score": 4.115772293166867}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.25497915047745073, "4": 0.2539342255565192, "3": 0.22172588772651006, "1": 0.157695708254973, "2": 0.11139024752278306}, "score": 3.3372035194174656}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"4": 0.403935607944629, "5": 0.346239966333035, "3": 0.18128005106702566, "2": 0.04052039708180466, "1": 0.027913528924399106}, "score": 4.000178554050256}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4435048684293359, "4": 0.27763463285720336, "3": 0.17081783204560105, "2": 0.05984227069078513, "1": 0.04797679607793448}, "score": 4.009074135744198}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4139910598314557, "4": 0.2800461130243541, "3": 0.237235893888369, "2": 0.04459180416318159, "1": 0.024044187394983003}, "score": 4.015440399607927}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5211547272671954, "4": 0.34523770472460596, "3": 0.10272131883470499, "2": 0.01763510078949986, "1": 0.013187586612432849}, "score": 4.343622288257581}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6026454933686828, "4": 0.26022196516460977, "3": 0.1035496366582408, "2": 0.01973740327465194, "1": 0.013741158223476125}, "score": 4.418441237034563}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.42804784596948836, "3": 0.286350727370663, "5": 0.14374143265535974, "2": 0.09590158208424407, "1": 0.04585454305588246}, "score": 3.5279748832357325}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6312995035512773, "4": 0.258848197280197, "3": 0.08920763936124915, "2": 0.013589932740797799, "1": 0.0069234990090360935}, "score": 4.494206355421323}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.31560817099306093, "4": 0.2985343731045472, "5": 0.17702831277847375, "2": 0.13041901755206808, "1": 0.07822331735353943}, "score": 3.3657936796679158}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.46172404571706543, "4": 0.4341551718320355, "3": 0.08642934669690543, "2": 0.010558036030088638, "1": 0.006975148926730969}, "score": 4.3333059261083}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.47438652310349744, "5": 0.2473947598819712, "3": 0.18036206070219238, "2": 0.05915555968445966, "1": 0.038533364599753914}, "score": 3.833093490444243}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"2": 0.2884581396774897, "1": 0.28164597627584653, "3": 0.2469158718917327, "4": 0.14387016759903642, "5": 0.039056287661447704}, "score": 2.370198920502812}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.31551003211326895, "3": 0.2956032781950089, "5": 0.2392193178318476, "2": 0.08814261070741346, "1": 0.06137487067487613}, "score": 3.583143723411001}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.37572685088676844, "5": 0.2787604689895132, "3": 0.257574391905038, "2": 0.05387027701585811, "1": 0.03395690018910545}, "score": 3.811553884046467}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.44311825644023994, "4": 0.37280720859413036, "3": 0.14363159868812833, "2": 0.023398204273778395, "1": 0.016960185689584243}, "score": 4.201826755844103}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.31855322706152195, "4": 0.27592312077040043, "5": 0.16585184319899046, "2": 0.1488195620253224, "1": 0.09072049342766637}, "score": 3.2774028070829346}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"1": 0.2955203435514221, "3": 0.2805700647515502, "2": 0.2459092779230074, "4": 0.1219042473741238, "5": 0.055897378285579793}, "score": 2.3966291563042645}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.30730614908710396, "4": 0.234557551272962, "2": 0.17431002714971944, "5": 0.15565321920130182, "1": 0.12782872462116845}, "score": 3.115936433521207}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7467364032145954, "4": 0.15524654699406792, "3": 0.06671609839064176, "2": 0.016767422701841898, "1": 0.014384179819145299}, "score": 4.603423040517924}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8534703727533443, "4": 0.11289939122525552, "3": 0.02678599775043699, "2": 0.0038509631235757666, "1": 0.002905146673312992}, "score": 4.810338422624486}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.275594278560019, "4": 0.26639977098025497, "3": 0.26242923873864993, "2": 0.11083250292371667, "1": 0.08443730269189197}, "score": 3.538046349502479}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3038890534333025, "3": 0.2992433072121522, "2": 0.15922760856070917, "5": 0.14773016186025933, "1": 0.08985086847206555}, "score": 3.260435397457625}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5455505558508287, "4": 0.3143949439941301, "3": 0.11150386778822162, "2": 0.01901267722388124, "1": 0.009431293718171363}, "score": 4.367766678978292}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5675097778973183, "4": 0.32175834389196223, "3": 0.09610414805438668, "2": 0.010475986929487126, "1": 0.003917443524685414}, "score": 4.438804137088527}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8821242763588824, "4": 0.10233694781695024, "3": 0.014084491225942904, "2": 0.0008271964051704134, "1": 0.0005577652405326681}, "score": 4.864772045152429}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4049008526976322, "5": 0.37533373079300647, "3": 0.16911195969533083, "2": 0.03514571761038695, "1": 0.015318138957786637}, "score": 4.089992981694996}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6213056364047957, "4": 0.28525858337008353, "3": 0.07393285223103091, "2": 0.010567162115119651, "1": 0.00855242508994284}, "score": 4.500773151448698}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5268279259408923, "4": 0.2967550286174638, "3": 0.1431492624126518, "2": 0.018003656550896224, "1": 0.015219384006535426}, "score": 4.302026711828405}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.45360114605296237, "4": 0.36313743774389967, "3": 0.14969993825722894, "2": 0.01690050121162974, "1": 0.01655292426530037}, "score": 4.220465254391634}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8526557146697737, "4": 0.13616066911327113, "3": 0.010178424948671034, "1": 0.0005206140383784973, "2": 0.000404463645766644}, "score": 4.840173829651229}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9870781088900381, "4": 0.011843093598474099, "3": 0.0008864921389517894, "1": 0.00010685732761812287, "2": 3.7509849730382665e-05}, "score": 4.985843284616573}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"3": 0.2849087572421475, "4": 0.2796359221342301, "2": 0.16584889106245562, "5": 0.1412769967195519, "1": 0.12816372895430111}, "score": 3.1400367712396378}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5804885514014487, "4": 0.2812627480755154, "3": 0.09510437559752696, "1": 0.02303511012125193, "2": 0.01994191860839943}, "score": 4.376457988212696}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8424303843679325, "4": 0.12625886442805256, "3": 0.026955174401530304, "2": 0.002261472792162049, "1": 0.002039986069144631}, "score": 4.804875864399329}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8680220512314081, "4": 0.10904866810791077, "3": 0.019709841489220472, "2": 0.0018095591986893194, "1": 0.0013774986458316646}, "score": 4.840587814756164}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9251621033118694, "4": 0.06548265372763097, "3": 0.007711396341176069, "1": 0.0008877876290942112, "2": 0.0007190015819766209}, "score": 4.9133831885331665}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3167224312104106, "2": 0.23091169829567826, "4": 0.22738594658345193, "1": 0.15456618384023343, "5": 0.07013668486005203}, "score": 2.8275674769985093}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7186232501780533, "4": 0.24274416722712386, "3": 0.035044194991597, "2": 0.0020539771339225113, "1": 0.0015103362059375749}, "score": 4.674956341377521}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.39344258117719527, "4": 0.3765270267959377, "3": 0.19074038812413055, "2": 0.026207116053438485, "1": 0.012947727355774628}, "score": 4.111459843846366}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.47858238952286764, "5": 0.2636145976110352, "3": 0.19998132335891666, "2": 0.03774518353137746, "1": 0.019997624249678835}, "score": 3.928144366343913}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.709492998959599, "4": 0.2334212775106726, "3": 0.04649949623980921, "2": 0.005401477779394081, "1": 0.005118954807142245}, "score": 4.636875585779833}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5032985229172383, "2": 0.16512747955867596, "3": 0.15233392389364847, "4": 0.1043489925535023, "5": 0.07450107680073025}, "score": 2.0812683114746005}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7604154502438843, "4": 0.18340242440992657, "3": 0.046473050199687754, "1": 0.005077254074753979, "2": 0.004456056040599871}, "score": 4.689919789512028}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3961495608960499, "5": 0.3843899833914858, "3": 0.18109878918624825, "2": 0.020636176554111367, "1": 0.017553428360001382}, "score": 4.109377375664595}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8266903332248416, "4": 0.13504928406720904, "3": 0.029763647877507057, "1": 0.0052417230938461715, "2": 0.0031826948625882736}, "score": 4.774892164119621}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.513958040565597, "4": 0.3063912803219275, "3": 0.10324491476753989, "1": 0.04900329687361104, "2": 0.027204926520598013}, "score": 4.209334734318465}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.45446330758940645, "4": 0.3499169984178972, "3": 0.13574956833850482, "2": 0.03333743297415699, "1": 0.026188670117679}, "score": 4.173532562066205}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4553770326407077, "4": 0.37315673370353497, "3": 0.1386323103480691, "2": 0.021383664276947194, "1": 0.01134359513070329}, "score": 4.23997220471789}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3042810494188116, "5": 0.268426726961261, "3": 0.26538953205654603, "2": 0.09452382120546618, "1": 0.06717064212834424}, "score": 3.612396916204835}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5276899730409242, "4": 0.38783014725986764, "3": 0.06769559281008422, "2": 0.009347839798204804, "1": 0.007232523296744412}, "score": 4.419686714851455}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5412122760086208, "4": 0.361782925621284, "3": 0.07295010971785583, "2": 0.013042291622525438, "1": 0.010618569191241304}, "score": 4.410483535315431}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2732323628078694, "3": 0.2642905005341104, "2": 0.1581782052826387, "5": 0.15364471305678842, "1": 0.150380669949243}, "score": 3.1216155114651705}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.3422946373805719, "4": 0.21690942692813606, "5": 0.18883701319875773, "1": 0.1352443279037537, "2": 0.11664016454670553}, "score": 3.2074700749778478}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9131233348972368, "4": 0.06890208087774002, "3": 0.015181343595940396, "1": 0.0014424979221985595, "2": 0.0012538760316394026}, "score": 4.891193072381345}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9425736438515172, "4": 0.04649170357728277, "3": 0.00894031907247641, "1": 0.0010146714636676919, "2": 0.0008643740107624925}, "score": 4.9289676612128055}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8460804494369059, "4": 0.10123858703408005, "3": 0.03772899809337616, "1": 0.008490491404034664, "2": 0.006332130674600423}, "score": 4.770315350955668}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.2886796162804667, "3": 0.27039346581247414, "5": 0.154018261874244, "2": 0.15248483965114845, "1": 0.13396277716106625}, "score": 3.176387067411757}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.37416553969102473, "5": 0.3142633029591421, "3": 0.2595548320117727, "2": 0.03264218854901565, "1": 0.019169490505065}, "score": 3.9319016862672926}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.663736596650581, "4": 0.26990827497966274, "3": 0.05680247955900581, "2": 0.005754143931509032, "1": 0.003589364900753851}, "score": 4.584780035410321}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7419103390321619, "4": 0.21372438812112735, "3": 0.038562094221153656, "2": 0.0037216505978775152, "1": 0.0019530979006557897}, "score": 4.690134283947036}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.40362409180590175, "5": 0.34475298634386753, "3": 0.1841268972704789, "2": 0.04077947450561087, "1": 0.026560118308434386}, "score": 3.999386689195571}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7350363832309091, "2": 0.16814585360594717, "3": 0.06834568833176287, "4": 0.01885145084774261, "5": 0.00938027686382829}, "score": 1.3990085908336003}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5360241301436158, "2": 0.2606087339706924, "3": 0.14765946035553212, "4": 0.04019590315972955, "5": 0.01540304595245174}, "score": 1.7382078106617291}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.6468479434201689, "2": 0.1811684350592514, "3": 0.11982657378426913, "4": 0.028854581340625438, "5": 0.023208580953710926}, "score": 1.6002760076427938}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.4646136402270801, "2": 0.21858896168690004, "3": 0.1871024782872749, "4": 0.08516438065423322, "5": 0.04437432688900863}, "score": 2.0259446329053112}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.4612528245317865, "2": 0.21316147540346192, "3": 0.18712307940420503, "4": 0.08805297121284521, "5": 0.05028996624527601}, "score": 2.0528524215810076}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6124803982086577, "2": 0.23229006687987677, "3": 0.12134404754133081, "4": 0.02616816718124079, "5": 0.007686600967541853}, "score": 1.5842470149898062}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8641177195327453, "2": 0.08546562762084833, "3": 0.03188516896591485, "4": 0.009841757265203803, "5": 0.008635320082788762}, "score": 1.2133141233612297}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.3117021483089005, "3": 0.28863331578341445, "2": 0.2527237206946339, "4": 0.10703732217123779, "5": 0.03983256042593281}, "score": 2.3105255194821828}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6261637065560451, "2": 0.19121406870092633, "3": 0.12614804518150918, "4": 0.040798343454568564, "5": 0.01559729152488589}, "score": 1.628343708521173}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.757984077118786, "2": 0.1409710258705185, "3": 0.061240717013915584, "4": 0.024175929247873117, "5": 0.015583391177458024}, "score": 1.3983316813403206}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"4": 0.30580491898154016, "3": 0.23976866891297688, "5": 0.22149824783050398, "2": 0.12446322353596334, "1": 0.1081151084995415}, "score": 3.408250793396823}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.29726648101087033, "4": 0.2923113434667218, "2": 0.1573008288029699, "1": 0.128446693152068, "5": 0.1245408754617185}, "score": 3.127215897984893}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3727272872964771, "4": 0.28275612555836704, "5": 0.16091303744806573, "2": 0.1179370820129473, "1": 0.06556804635171726}, "score": 3.355544018854188}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5859360646794768, "4": 0.32266446620807393, "3": 0.0768224779508298, "2": 0.008956545260077463, "1": 0.005534063074774159}, "score": 4.474639307669263}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.47830892912926776, "4": 0.3522929165988021, "3": 0.12862562831252625, "2": 0.02192614979301902, "1": 0.018732801515610256}, "score": 4.2496609518392905}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3011776466860948, "4": 0.22180736478407975, "2": 0.21838188121994864, "1": 0.16790163113940512, "5": 0.09058804756203245}, "score": 2.8487766266513828}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.376916839781627, "5": 0.3642564960584851, "3": 0.1903709389194228, "2": 0.04506458031042697, "1": 0.02310743619624467}, "score": 4.014438184168424}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3594963337733567, "5": 0.3207076880033161, "3": 0.23438919939670405, "2": 0.053350752306158114, "1": 0.03193432911556375}, "score": 3.8837998553915565}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.38487776061723533, "5": 0.2573122374003803, "3": 0.23579129698984794, "2": 0.07646368933858842, "1": 0.04536523573350859}, "score": 3.7324470783606487}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.465920574672545, "4": 0.3371297526606865, "3": 0.14417148786490316, "2": 0.03401504337544927, "1": 0.018660156437940202}, "score": 4.197758896940645}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.640164208344508, "4": 0.28044795918056953, "3": 0.06517809713500666, "2": 0.007713382281412754, "1": 0.006378161431737602}, "score": 4.540488743595317}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4924684408084148, "4": 0.3827316837243439, "3": 0.11036557659119396, "2": 0.009611297975807126, "1": 0.0047759135689934866}, "score": 4.3485689407398}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8417444957650436, "4": 0.13500662873613647, "3": 0.021719070054572714, "2": 0.0009297898175442582, "1": 0.0005290773063581618}, "score": 4.816636544981141}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5944122361938566, "4": 0.33815855359930674, "3": 0.059719731637504686, "2": 0.005127697761324562, "1": 0.002470482014031131}, "score": 4.517083213729682}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.737447027844017, "4": 0.21864602085179743, "3": 0.03751416439961258, "2": 0.003789015712809735, "1": 0.0025337243084070996}, "score": 4.6848016273132735}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"1": 0.3924114391332925, "2": 0.25624570747164244, "3": 0.20945861518851253, "4": 0.09153590310516443, "5": 0.05024504720425583}, "score": 2.1508697068930824}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7307094773756154, "4": 0.19634958726451035, "3": 0.05525632309357722, "1": 0.00920592758208756, "2": 0.008405432970533219}, "score": 4.6310707326073235}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4490554060849498, "4": 0.20552432134604873, "3": 0.2042597113465459, "1": 0.07464296494203615, "2": 0.06635401550433447}, "score": 3.8881404708350336}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8813111298991579, "4": 0.09895092092536151, "3": 0.01655680638120087, "1": 0.0018157608463750666, "2": 0.0013247726753985235}, "score": 4.856692285278502}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9429494483968186, "4": 0.04659388358527068, "3": 0.008250371907125737, "1": 0.0013158303075814653, "2": 0.0007982406017546853}, "score": 4.929240803783762}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"2": 0.318668118068804, "1": 0.29032720469296386, "3": 0.23168458030901481, "4": 0.11893160488114626, "5": 0.04019429133633012}, "score": 2.2998616927414877}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7934351015080287, "4": 0.1498014692304779, "3": 0.04647816716419847, "2": 0.005758013743165619, "1": 0.004428560904315564}, "score": 4.7222264988359095}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.48447962606545153, "4": 0.2718529456167863, "3": 0.1847472692588507, "2": 0.03473762102265654, "1": 0.024110424021212745}, "score": 4.157937232185587}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5667332185511361, "4": 0.3215921342996193, "3": 0.09144107529459845, "2": 0.012907970373494573, "1": 0.007213105494218768}, "score": 4.427885021374666}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.38769846250319545, "5": 0.3312228722929368, "3": 0.20471074423061872, "2": 0.04722705743001953, "1": 0.028949000517436378}, "score": 3.9452004976516366}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"4": 0.27946816295853244, "3": 0.27291723452518, "2": 0.15966801908727427, "5": 0.14515689312111468, "1": 0.1423368140552369}, "score": 3.125497136675991}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4726908491757536, "4": 0.362192442244441, "3": 0.12657288129477667, "2": 0.02102462309079212, "1": 0.01728719370263742}, "score": 4.25226566887333}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3986865738420247, "3": 0.2935337660982388, "5": 0.20122187982981152, "2": 0.06683977109043245, "1": 0.03949851115752449}, "score": 3.6554374072843716}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8437211752884917, "4": 0.13266122245224027, "3": 0.020382864634511614, "2": 0.001973502689608751, "1": 0.0011794712902773751}, "score": 4.81591960396467}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4039623493670063, "4": 0.3544046994641872, "3": 0.17057145144248353, "2": 0.03756353173158863, "1": 0.033390585165764805}, "score": 4.058098317725767}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3242598105868883, "4": 0.3202248095510212, "5": 0.15962505820398395, "2": 0.11466920200644036, "1": 0.08108915910314173}, "score": 3.3626752645731144}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8524945438678166, "4": 0.09460000027663922, "3": 0.041821458915379556, "1": 0.005703832281309117, "2": 0.0052540960845530995}, "score": 4.783152126811492}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.337295290284153, "2": 0.1895189991724648, "4": 0.18101423579645146, "1": 0.15758015965455777, "5": 0.13430018472345756}, "score": 2.9449192510830344}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8659983636250078, "4": 0.11812971247449432, "3": 0.013398256398586762, "1": 0.0014272924800450516, "2": 0.0009546303122697153}, "score": 4.846486629831778}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9354484116546846, "4": 0.05481004494005899, "3": 0.007896333035438298, "1": 0.0010910464471838139, "2": 0.0006064229973290067}, "score": 4.923202488072868}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3855427990354537, "4": 0.29671137916325024, "3": 0.1972926933179377, "1": 0.07114094705483824, "2": 0.04915454326188649}, "score": 3.876498709512219}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.29260242577995804, "3": 0.28879277199350073, "1": 0.2723725992203447, "4": 0.11915475125309304, "5": 0.026979342456916966}, "score": 2.335700638003417}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5937711519090153, "4": 0.2935934769386498, "3": 0.09342396332557101, "2": 0.011048266954669799, "1": 0.008090858782184114}, "score": 4.454010895183899}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8523664406136838, "4": 0.12001182492659301, "3": 0.02214882126354047, "1": 0.003271116222087786, "2": 0.002152447956757453}, "score": 4.8161396504601255}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.26633022307992554, "3": 0.21590840762521246, "1": 0.21110367826543688, "5": 0.19227552684172425, "2": 0.11430210407449688}, "score": 3.114380973511691}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5171676201996961, "2": 0.2914374138550505, "3": 0.14611970440758368, "4": 0.03261453601363734, "5": 0.0125199175349151}, "score": 1.7317031304972264}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31816616539052894, "2": 0.27330141735062496, "4": 0.18781921521561643, "1": 0.16579445180821234, "5": 0.05487326639371029}, "score": 2.692661448098065}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.3340544083568755, "3": 0.31076657851696793, "1": 0.1870622181660919, "4": 0.13082857506749693, "5": 0.03724477546375273}, "score": 2.4971174338600957}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3440016242372406, "4": 0.3286803109048532, "2": 0.14713967106566334, "5": 0.11130288501137162, "1": 0.06881672965583935}, "score": 3.266528616869149}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.30866766458886863, "3": 0.3001820965406776, "1": 0.2100643009778945, "4": 0.13625856296010294, "5": 0.04476845576290215}, "score": 2.4969695698060423}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3979721026494463, "4": 0.3223657204984619, "3": 0.15408032833440194, "1": 0.0722192968068761, "2": 0.05320507991867558}, "score": 3.9208112540633246}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5535757388337463, "4": 0.2871195498371894, "3": 0.11954755942096358, "1": 0.02116811158972481, "2": 0.01830092818370428}, "score": 4.3340182229794415}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7750296982813222, "4": 0.17606030510333168, "3": 0.03486627323409701, "1": 0.007156453800218356, "2": 0.0066779181112644635}, "score": 4.705485921938698}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.679129247336041, "4": 0.2393033703411608, "3": 0.0597275076527715, "1": 0.0117403106983061, "2": 0.00990968616161434}, "score": 4.564468615329674}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.409897381350674, "5": 0.35805388039835273, "3": 0.1622820675648616, "2": 0.0400562284782528, "1": 0.029593634247107904}, "score": 4.026881593119736}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"4": 0.28083089161711233, "3": 0.2525845587979799, "5": 0.2232152335794442, "2": 0.12407742662161284, "1": 0.1189516703353632}, "score": 3.36540490919418}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.31118070205253373, "2": 0.19698637796908278, "4": 0.1889452100245306, "1": 0.16298879872747643, "5": 0.13960942173400606}, "score": 2.9451842094731338}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4038286599561839, "4": 0.2727936855749803, "3": 0.17733833035712898, "1": 0.074974576718366, "2": 0.07054369316012558}, "score": 3.8604064773277877}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.542644971877295, "4": 0.29021826533679146, "3": 0.11336835308060211, "1": 0.028733853123477364, "2": 0.024791966741472247}, "score": 4.293562341184801}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4375934044875267, "4": 0.32590214871096, "3": 0.15769941414766106, "1": 0.04055095287215545, "2": 0.037997150838536}, "score": 4.082267967068161}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4097530163276238, "3": 0.270181128122897, "5": 0.22301393961307087, "2": 0.062115532533836976, "1": 0.034833618837050793}, "score": 3.7240725343452246}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6203689917434577, "4": 0.2929918166140471, "3": 0.07358830980750089, "2": 0.007705574122557229, "1": 0.005261342798111865}, "score": 4.5156288000245235}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6865394431489954, "4": 0.260671939252011, "3": 0.04640609827710488, "2": 0.003540651603463614, "1": 0.002728847281944748}, "score": 4.6249361303733565}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8638084207569369, "4": 0.1260095224356734, "3": 0.009292348122696378, "1": 0.00044417008258458584, "2": 0.00038687148507298677}, "score": 4.852459830777001}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8811395905710763, "4": 0.10506182422055849, "3": 0.011547341981159432, "1": 0.0013558963912715428, "2": 0.0007654351977073598}, "score": 4.864105946439791}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.36068881525331703, "3": 0.24424144848317408, "5": 0.20429686956747758, "2": 0.11279677846877438, "1": 0.07781718385610671}, "score": 3.5009310083341543}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3732963913493372, "4": 0.3545716988517219, "3": 0.17749722570851437, "2": 0.05612204413795822, "1": 0.03840800029779635}, "score": 3.968327762299502}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6226901596142467, "4": 0.2525882213006356, "3": 0.10186370344488926, "2": 0.01451509698237696, "1": 0.008243790736580136}, "score": 4.467111147040757}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5129483762328847, "4": 0.3184616243265238, "3": 0.12091521275961706, "2": 0.027077680181172507, "1": 0.02052247196098633}, "score": 4.276331011065535}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4238941928740981, "5": 0.2583337307270048, "3": 0.21666261606931908, "2": 0.06539490034077854, "1": 0.035617581524023376}, "score": 3.804009562552324}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3200467820395673, "4": 0.21287856355717463, "2": 0.16061808095933303, "5": 0.15671103671013048, "1": 0.14969908497001272}, "score": 3.066287465247754}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8567873964349791, "4": 0.10530339701617773, "3": 0.02863381262097703, "1": 0.005427836277756832, "2": 0.003766133125734766}, "score": 4.804403306885929}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4165788998090488, "4": 0.26350587901427286, "3": 0.2023975998677614, "1": 0.061638944025248124, "2": 0.05576660865026167}, "score": 3.917722029785338}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6128004660687443, "4": 0.2583116441372427, "3": 0.09273246054622845, "1": 0.018600585876918457, "2": 0.017395716173471812}, "score": 4.429543167545227}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5524348340319838, "4": 0.24290644737395298, "3": 0.11700193568558472, "1": 0.047698286698660185, "2": 0.03982574964043872}, "score": 4.212714776126329}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.29163851673553715, "2": 0.23372122967331277, "3": 0.22500215478530422, "4": 0.1649831716966721, "5": 0.08450143183243715}, "score": 2.516913620739687}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4087827817444904, "5": 0.3372884432592577, "3": 0.18575215385511526, "2": 0.04425392548223013, "1": 0.023858362360975598}, "score": 3.9914528014872874}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.45166193970003005, "5": 0.27797547183317073, "3": 0.21469342471939962, "2": 0.0407755272435293, "1": 0.014839920476257757}, "score": 3.9372078582535193}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3790083130391587, "5": 0.36314248538936533, "3": 0.18282952823370496, "2": 0.04591266839984532, "1": 0.02905169063381982}, "score": 4.0013326221675785}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.41226564829384976, "5": 0.2961959945584501, "3": 0.21418595343203548, "2": 0.047720748339093184, "1": 0.029553839832551554}, "score": 3.897899079911932}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.24869033276446267, "4": 0.24384997484103982, "1": 0.22053342682642324, "2": 0.19436261793885143, "5": 0.09233038438883458}, "score": 2.793032994232592}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.41098057433279156, "4": 0.33772247522002324, "3": 0.15876296107105364, "2": 0.05162888377614298, "1": 0.040569213021189626}, "score": 4.027261363535581}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6125936011712482, "4": 0.2925698024282692, "3": 0.07490360940254143, "2": 0.01184814930963394, "1": 0.007873593605478513}, "score": 4.490476522596169}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7449378700397569, "4": 0.2114832034418586, "3": 0.036185474412488434, "2": 0.00423908641972763, "1": 0.003038971935108883}, "score": 4.69123707142103}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6215856908883786, "4": 0.2541483061185715, "3": 0.0806748258264217, "1": 0.022693008443945506, "2": 0.02072288155651478}, "score": 4.431461706316901}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3532109883120474, "4": 0.23358024482273496, "2": 0.17501660917339384, "1": 0.13291775838899614, "5": 0.10507824666706492}, "score": 3.002885178140776}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4298577065753528, "4": 0.3215202343371053, "3": 0.17531772145642224, "2": 0.04252005210864866, "1": 0.030612204796020014}, "score": 4.077676633165037}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.35783463954597394, "2": 0.22503656024500127, "4": 0.1814670108862019, "1": 0.1620358292490212, "5": 0.07339248740723481}, "score": 2.7790921910224}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6817719235620763, "4": 0.21775907236157474, "3": 0.07611851084507136, "2": 0.012399630564505644, "1": 0.011737047345559023}, "score": 4.545759701337162}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3287257705353124, "3": 0.2920709870277429, "5": 0.16779232918978454, "2": 0.11774699106502574, "1": 0.09340955846106981}, "score": 3.3598358501135235}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5633713932686403, "2": 0.24798614532566882, "3": 0.1279784997339135, "4": 0.04464969958061309, "5": 0.015967202568619502}, "score": 1.7017940799041382}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.3113232554563114, "3": 0.2740619234870163, "2": 0.23401686349573295, "4": 0.1223354521155526, "5": 0.05813685958593812}, "score": 2.3818681311691607}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3587592960175431, "3": 0.2576437917939626, "5": 0.21289665900412258, "2": 0.09547259843969615, "1": 0.07509368587337376}, "score": 3.5389648483517497}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.29442078305586267, "5": 0.2584543232172038, "3": 0.23825737072270586, "1": 0.1078152246456713, "2": 0.10100041027706193}, "score": 3.4947242402135594}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.6139944315579373, "2": 0.2469700264802722, "3": 0.10450808940491142, "4": 0.027931281989190492, "5": 0.006488146385004013}, "score": 1.5657937562057647}]