[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5440459330157336, "4": 0.4488946281330412, "3": 0.0069675027773029845, "2": 1.4075392471906465e-05, "1": 0}, "score": 4.537092097810224}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.861301139661725, "4": 0.13763704050381287, "3": 0.0010415488446450028, "2": 1.192996915918241e-06, "1": 0}, "score": 4.860273617117209}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5805568034525552, "4": 0.41469635552036305, "3": 0.004682158768906527, "2": 2.733611306590255e-06, "1": 0}, "score": 4.575904853987465}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7882471312142495, "4": 0.20990784036387625, "3": 0.000696455609809109, "2": 3.436225569933457e-07, "1": 0}, "score": 4.788455315767514}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5212435708739308, "5": 0.4779132730912345, "3": 0.0008410565995152008, "2": 1.8587023035480092e-06, "1": 9.052045406584961e-08}, "score": 4.477068299187403}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5839578344761582, "3": 0.20861012494197823, "5": 0.19163892048863768, "2": 0.013649595383840425, "1": 0.0021335131324502414}, "score": 3.949328558080588}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5540949594355311, "5": 0.23640458465608188, "3": 0.1924053758755048, "2": 0.014301755314265684, "1": 0.0027886072537251054}, "score": 4.0070299095542214}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6375846987439139, "5": 0.24152120605331115, "3": 0.11684460375758662, "2": 0.003620152959614425, "1": 0.0004257532520703638}, "score": 4.116159453079047}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6685714146155068, "5": 0.23631398814271412, "3": 0.09133161274481905, "2": 0.0034241945596132986, "1": 0.0003559408473668768}, "score": 4.137066554251515}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.47370600136815233, "5": 0.38266293980641636, "3": 0.13467877235554515, "2": 0.007864059736250387, "1": 0.0010564758285159861}, "score": 4.229093894431328}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.41207712110577494, "4": 0.18390673957517847, "3": 0.1714820641604582, "1": 0.16777508102491467, "2": 0.06467738337652162}, "score": 3.607883046156034}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5182102349936835, "3": 0.23651023382477293, "5": 0.19877071588727208, "2": 0.03804807832089044, "1": 0.008431096873097253}, "score": 3.860866910882713}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6521593793969036, "4": 0.19948702148129624, "3": 0.11038845774677115, "1": 0.022142257325741595, "2": 0.015767538148352977}, "score": 4.443833637748747}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.409263531146305, "4": 0.22405269707411749, "3": 0.2062967938970005, "1": 0.10661626490960661, "2": 0.053647253721718025}, "score": 3.775795754988833}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8847731451473546, "4": 0.058433974684937, "3": 0.0372255918975448, "1": 0.013426216878180497, "2": 0.005949673112556139}, "score": 4.795521817897348}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6885998127543391, "3": 0.1591190205297378, "5": 0.15003376653290776, "2": 0.0020578473876104518, "1": 0.00018445961635250418}, "score": 3.986245602325281}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5531747631444238, "3": 0.42627487257701013, "5": 0.011478238966366646, "2": 0.008779243822887013, "1": 0.00026288864986047264}, "score": 3.5668432211922765}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5846308596883754, "4": 0.3996307033296995, "2": 0.011656515324191288, "5": 0.0037241114221355275, "1": 0.0003519331553405851}, "score": 3.394720864345297}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5610876987048117, "4": 0.4233115441644235, "2": 0.009233523121436365, "5": 0.00611699387518376, "1": 0.0002433467930781296}, "score": 3.425828250586566}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7123450031094417, "3": 0.24546156550291592, "5": 0.03898029566062938, "2": 0.0030717476876384415, "1": 7.375055775450446e-05}, "score": 3.787139585766818}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5416127913262615, "5": 0.4155763612433316, "3": 0.04221172723425234, "2": 0.0004995571759800107, "1": 7.806607300851897e-05}, "score": 4.372139321297421}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6511950927666166, "4": 0.33590412567136707, "3": 0.012637091747551133, "2": 4.1904723696664645e-05, "1": 0}, "score": 4.638615827040839}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9388255817146828, "4": 0.05968104578697286, "3": 0.0014514691915131178, "2": 4.992988148857955e-06, "1": 0}, "score": 4.9373987262325905}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8067463035203591, "4": 0.18759980159622328, "3": 0.005604494017216952, "2": 1.8865418893448672e-05, "1": 0}, "score": 4.801128541483721}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7387038149871787, "5": 0.15502039346122154, "3": 0.10522546975969961, "2": 0.0009408371442886115, "1": 6.580188977898834e-05}, "score": 4.047717928194309}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6357503526378493, "3": 0.27185819242926823, "5": 0.08140243438265561, "2": 0.010744928534035605, "1": 0.00021832931843795555}, "score": 3.787393919623813}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6349745243678413, "5": 0.27196905161143037, "3": 0.09094821503445354, "2": 0.001948001117688294, "1": 8.00594559461003e-05}, "score": 4.176898834134516}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.614645721355592, "3": 0.32190255611419555, "5": 0.04389792177494751, "2": 0.018958204234710608, "1": 0.0005376059505958005}, "score": 3.682447724302084}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.692381807899883, "5": 0.2360478122963399, "3": 0.07064093405674496, "2": 0.0008765042541933402, "1": 3.584842230915e-05}, "score": 4.163549120020924}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5498384341507156, "5": 0.42722908960916806, "3": 0.022750191864871844, "2": 0.00014574879505091347, "1": 0}, "score": 4.404202167914915}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"4": 0.879717936142917, "3": 0.0601351770509037, "5": 0.059939815210876414, "2": 0.0002025307157913752, "1": 0}, "score": 3.9993995740019277}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8605920382627439, "3": 0.12500199272586315, "5": 0.01304274811072073, "2": 0.0013508760109154521, "1": 1.0670079946881537e-05}, "score": 3.8853068010338907}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.604042088818962, "5": 0.3912968499560252, "3": 0.004642419985982974, "2": 6.469058356481006e-06, "1": 0}, "score": 4.38664619818071}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7175194311305584, "5": 0.2783644368169267, "3": 0.004105426269229823, "2": 7.270787139474634e-06, "1": 0}, "score": 4.274245411005348}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8158338744313662, "5": 0.1673987982274538, "3": 0.016720847246029083, "2": 4.082091440202227e-05, "1": 0}, "score": 4.150597161409177}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7795729961751616, "5": 0.17322383098960872, "3": 0.045672861396666306, "2": 0.0013064460073948963, "1": 0.00022115295317940174}, "score": 4.124274955811697}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6275029856371671, "5": 0.31417349934070476, "3": 0.05387828812166132, "2": 0.003319001481085159, "1": 0.001115481643585313}, "score": 4.250313452637733}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5621645940454926, "5": 0.42594970630471707, "3": 0.01171257181444876, "2": 0.00013999665898956198, "1": 2.492779779176267e-05}, "score": 4.413885753040426}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5362058570412538, "5": 0.4423295661370547, "3": 0.021164094263401413, "2": 0.00025114929370898177, "1": 3.927116591903855e-05}, "score": 4.4205495913999595}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7719148522911095, "3": 0.10999361063643993, "5": 0.10825733008293983, "2": 0.008977205828879129, "1": 0.0008528430713701785}, "score": 3.977750686059997}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9536853306782959, "4": 0.045408616554214326, "3": 0.000871185787660148, "2": 1.7443822211374633e-05, "1": 1.2301762661994418e-05}, "score": 4.952747231353093}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9186382210684101, "4": 0.07546828327968957, "3": 0.005257391435782765, "1": 0.00038314214571541743, "2": 0.00021167425457423874}, "score": 4.911845702803775}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8949334464326523, "4": 0.10409797041968742, "3": 0.0009292200310435088, "2": 2.6199587096264892e-06, "1": 0}, "score": 4.894031836037116}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9881174586769598, "4": 0.011768556588759568, "3": 0.00010348654020956476, "1": 5.738653787087693e-07, "2": 0}, "score": 4.988022055996254}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6687010765558445, "4": 0.32215612200266924, "3": 0.00899086695198212, "2": 7.460724033762452e-05, "1": 0}, "score": 4.65961200110475}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9565118129453453, "4": 0.04288648661455354, "3": 0.000517292541081696, "2": 6.742559839457941e-07, "1": 0}, "score": 4.956073227386634}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9032390246347317, "4": 0.09539008850526975, "3": 0.0012014988018500797, "2": 7.784461652174068e-07, "1": 0}, "score": 4.902188086523755}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9790407276892817, "4": 0.020670370105625887, "3": 0.0002241699698218937, "2": 1.8857444016063772e-07, "1": 0}, "score": 4.97887936102805}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9836139491601127, "4": 0.016061027398505387, "3": 9.881363071737167e-05, "2": 1.0427199659618511e-07, "1": 0}, "score": 4.983737355450064}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9374601956615024, "4": 0.06155544288258915, "3": 0.0009619221843686233, "2": 1.2872337782036651e-06, "1": 0}, "score": 4.936515508220971}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8560700603383075, "4": 0.14059284358667717, "3": 0.003281271103835232, "2": 1.23079273892233e-05, "1": 0}, "score": 4.852801284770548}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9901272319400067, "4": 0.009826757075649954, "3": 3.9261447508176595e-05, "1": 0, "2": 0}, "score": 4.990094653172831}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7772564356902785, "4": 0.21954490254165854, "3": 0.0031069724987325136, "2": 4.729571270759123e-06, "1": 0}, "score": 4.774207328884561}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9481078949167725, "4": 0.05119340314817917, "3": 0.0006765531143390815, "2": 1.606208701117436e-06, "1": 0}, "score": 4.94744759243332}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6195610534403614, "4": 0.3696718347536478, "3": 0.010707412717899102, "2": 3.98079068831286e-05, "1": 1.5077771271109973e-05}, "score": 4.6087317216702015}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7526008435317122, "5": 0.204417338076692, "3": 0.04264746261562729, "2": 0.0003097500116016931, "1": 1.7237729516166146e-05}, "score": 4.161099849238616}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7975020450503242, "5": 0.12621057964746185, "3": 0.07543310062267024, "2": 0.0008110896235732103, "1": 3.613375817808068e-05}, "score": 4.049047244349837}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6286136751020437, "5": 0.3167627525423021, "3": 0.054053185525046885, "2": 0.00042013855845874937, "1": 0}, "score": 4.261908641221142}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6997513999118556, "3": 0.2332323294755295, "5": 0.061830840610017125, "2": 0.0049429710571258405, "1": 0.0002199898827872596}, "score": 3.818048511092464}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.48344607539424994, "3": 0.4589886761146975, "5": 0.037980709229873844, "2": 0.01872694281164524, "1": 0.0008023962458331809}, "score": 3.539105517285056}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8838052730188528, "4": 0.11059884864825849, "3": 0.00549598364426958, "2": 6.128747860986475e-05, "1": 2.9686593837609308e-05}, "score": 4.878105487877866}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9736840314484367, "4": 0.024959843638093282, "3": 0.0013003861762161712, "1": 2.6302488591660494e-05, "2": 2.1939497648142327e-05}, "score": 4.97226814766337}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8205707288781751, "4": 0.17067676063738837, "3": 0.008501709653543, "2": 5.6112609635864455e-05, "1": 0}, "score": 4.812114903211324}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9851214494270731, "4": 0.01456419149847356, "3": 0.0003011093711235257, "2": 3.5685007798432655e-06, "1": 0}, "score": 4.984822737322787}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9825056977685644, "4": 0.016882710973737378, "3": 0.0005807149158115069, "2": 8.460138612703903e-06, "1": 0}, "score": 4.981930073719662}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.709665561543913, "3": 0.17820168648305568, "5": 0.10764449440003321, "2": 0.00407714455318881, "1": 0.00038644333936418333}, "score": 3.920127218356508}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6640850834425203, "5": 0.30867630740447594, "3": 0.026965254825656877, "2": 0.00013147024575128452, "1": 0}, "score": 4.281488050760879}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7465423441760708, "3": 0.20138572098391816, "5": 0.04494517793566445, "2": 0.006761314196876828, "1": 0.00034717648673805365}, "score": 3.828992175431108}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8709904034877781, "5": 0.08518657738394, "3": 0.04351419814519784, "2": 0.0002592955570413807, "1": 0}, "score": 4.041155826384495}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6879455958327104, "3": 0.26492431435412106, "5": 0.04126519790483507, "2": 0.005575016511144895, "1": 0.00027346169520658394}, "score": 3.7643665978263647}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7327511572997683, "4": 0.24734137785291682, "3": 0.01961667517920255, "2": 0.00023594637578672802, "1": 4.102300709444469e-05}, "score": 4.7125493679832156}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9166445450074261, "4": 0.08059294212428156, "3": 0.0027301410621580783, "2": 1.977778934794745e-05, "1": 0}, "score": 4.913886357866703}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7588845660830393, "4": 0.23675462777758027, "3": 0.00431318227690937, "2": 2.6249306193493383e-05, "1": 0}, "score": 4.754535013044842}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8659072740480784, "4": 0.13043357312661286, "3": 0.003625628595693425, "2": 2.0583577682092127e-05, "1": 6.355239291371781e-06}, "score": 4.86222709070033}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6940368443798781, "4": 0.2977895648932884, "3": 0.008080560823571158, "2": 6.138537152349159e-05, "1": 0}, "score": 4.685855216380423}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8541556772029215, "3": 0.09689522876974532, "5": 0.047806230633409906, "2": 0.0010600438540167836, "1": 6.447716034823525e-05}, "score": 3.948596539812809}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5589755754909224, "4": 0.43608521826310415, "3": 0.004741427634074633, "2": 7.682073962963645e-06, "1": 0}, "score": 4.554324158812405}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.684362897603955, "5": 0.29437674100114536, "3": 0.021105989842386177, "2": 0.00013395602279176854, "1": 1.5172135549341503e-05}, "score": 4.272958753936866}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6092511980771814, "5": 0.37127312546143765, "3": 0.019332348462426967, "2": 0.00011607268131572486, "1": 1.820567862836117e-05}, "score": 4.351657196971183}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6508067446900748, "4": 0.3443287876573777, "3": 0.004812555726032263, "2": 1.9901409491967093e-05, "1": 0}, "score": 4.645975064140846}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9151068358781744, "2": 0.05814840671284364, "3": 0.020448014329697856, "4": 0.0032639061348469223, "5": 0.0030294284730746713}, "score": 1.1209542799382783}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8518466726723788, "4": 0.11399006312009341, "3": 0.026742233078662907, "1": 0.004693315578113097, "2": 0.00272238212689715}, "score": 4.805584025126639}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6386765080334394, "4": 0.2567378380850944, "3": 0.06716058071977173, "1": 0.026070316779452065, "2": 0.0113428011068353}, "score": 4.470625001213143}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9614945578805019, "4": 0.03460688943918896, "3": 0.003039053076742787, "1": 0.0006109905899347902, "2": 0.00024472657280779047}, "score": 4.956136696418812}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7746107452494188, "1": 0.12434839698124663, "4": 0.054731273791336896, "3": 0.030910170711397452, "2": 0.015392390731784196}, "score": 4.33987298890061}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6844887977382791, "2": 0.12426063799554504, "3": 0.07951572326173095, "5": 0.0636377583530994, "4": 0.04809222294875154}, "score": 1.6821231016930662}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7025790060287388, "4": 0.16909883711642112, "1": 0.07433828381497262, "3": 0.03975916096127711, "2": 0.014221684524279998}, "score": 4.411362869997414}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5872033128049162, "4": 0.3170395973911461, "3": 0.07069415378155512, "1": 0.014934982485945809, "2": 0.010110720322211756}, "score": 4.451490551554497}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8325630868489154, "4": 0.08500074141503822, "3": 0.03978968385153388, "1": 0.03336533474026457, "2": 0.009268826486763844}, "score": 4.6741480557952375}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.3264337697500189, "4": 0.27490472387021353, "3": 0.18732861591912586, "1": 0.13579471257479075, "2": 0.07552608392063058}, "score": 3.5806637768275618}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6275024648099051, "3": 0.3225414577001712, "5": 0.04185538150462744, "2": 0.007746751382093308, "1": 0.0003003818678247703}, "score": 3.702903362128199}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7263768512321448, "4": 0.2555850622724813, "3": 0.01767678645302555, "2": 0.00010902318412039168, "1": 0}, "score": 4.708660797130327}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7068097316686611, "4": 0.2851795776852825, "3": 0.007936187363232271, "2": 4.5284262138441754e-05, "1": 0}, "score": 4.69880339413198}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5902485261573379, "4": 0.39481503088384734, "3": 0.014822593120910839, "2": 8.387030000083886e-05, "1": 0}, "score": 4.575275438928252}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6618738897893234, "5": 0.30355784304581995, "3": 0.034321836318841815, "2": 0.00019049721174763261, "1": 0}, "score": 4.26887005118259}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"2": 0.48944618586546207, "3": 0.3629853513279525, "4": 0.0851536250721859, "1": 0.05295362227108633, "5": 0.009459790897698607}, "score": 2.5087190765980374}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4667717727898313, "4": 0.409324413624585, "3": 0.11497400725910417, "2": 0.007900830487771843, "1": 0.001025252864236832}, "score": 4.332921585421037}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5839197266313528, "5": 0.21704095728556333, "3": 0.19389854900006073, "2": 0.004799396971010552, "1": 0.000340006269778191}, "score": 4.0125236126143795}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5502001598285362, "5": 0.308990081903253, "3": 0.1358343975875031, "2": 0.004515488062268409, "1": 0.0004566222935226168}, "score": 4.162755370318481}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5892747944916419, "5": 0.2764974446042687, "3": 0.12794863303765466, "2": 0.00553232011943548, "1": 0.0007400067131373333}, "score": 4.13526507113066}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5400280642180955, "5": 0.3860334172801182, "3": 0.07320511378530593, "2": 0.0006656894416540963, "1": 5.711875707849295e-05}, "score": 4.311328867342137}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9097638305702865, "4": 0.085172096896661, "3": 0.005018192850653918, "2": 2.8074047075986443e-05, "1": 0}, "score": 4.9047055984834405}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7522374852758998, "4": 0.23806031810607906, "3": 0.009652686582947632, "2": 2.441048023630906e-05, "1": 0}, "score": 4.7425546155227725}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9482342425041754, "4": 0.0511592276060404, "3": 0.0005159663540180765, "2": 1.181072067703416e-06, "1": 0}, "score": 4.947800630761495}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5678469220594607, "5": 0.3974309780860584, "3": 0.03457446068369401, "2": 8.88081618024557e-05, "1": 0}, "score": 4.362700239099785}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"4": 0.47385252708003095, "5": 0.46444106831695287, "3": 0.06073230590555848, "2": 0.0008348413927152477, "1": 8.517300645281897e-05}, "score": 4.40180529196387}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8580756527610858, "5": 0.11763671380736136, "3": 0.023789832392124795, "2": 3.424452020743295e-05, "1": 0}, "score": 4.093821884120851}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6751403863207158, "5": 0.3028677613271929, "3": 0.02188116189010118, "2": 4.829227248809546e-05, "1": 0}, "score": 4.280907543014216}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6760054640889639, "4": 0.3199686361573938, "3": 0.0039929163511240925, "2": 5.608450947494673e-06, "1": 0}, "score": 4.672019727343435}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.626701429975301, "4": 0.35670794972497366, "3": 0.016316449634803058, "2": 0.0001838057618605571, "1": 0}, "score": 4.610072497958916}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5382676778938417, "5": 0.4527777599579812, "3": 0.008908581084112868, "2": 2.2868731892048278e-05, "1": 0}, "score": 4.443833699441974}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5670934919762812, "5": 0.41434404238887423, "3": 0.01845913332163665, "2": 8.136091987958228e-05, "1": 0}, "score": 4.3957308819863385}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6473439683298974, "5": 0.3381554425549245, "3": 0.01443961800232488, "2": 3.673009910254769e-05, "1": 0}, "score": 4.323650209963584}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5650242660482517, "5": 0.42802989401928343, "3": 0.00692725256262012, "2": 1.5555146647237525e-05, "1": 1.5775303553847762e-06}, "score": 4.421067411096052}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8122819906356077, "4": 0.18556606774393947, "3": 0.00211948742540747, "2": 2.8432522572054867e-06, "1": 0}, "score": 4.810180806923208}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7879138204627669, "3": 0.1524471805468455, "5": 0.0575931005829892, "2": 0.0016446647745496108, "1": 0}, "score": 3.9018171962440107}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5669286051645188, "5": 0.3874887356118626, "3": 0.04521170343980556, "2": 0.00027681005749502095, "1": 0}, "score": 4.341755586885018}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.643608774814629, "5": 0.2868454528709824, "3": 0.06881796148632505, "2": 0.0006018751055760368, "1": 0}, "score": 4.216851050467219}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5445917759172506, "5": 0.43467198057028084, "3": 0.0205985704752468, "2": 3.859136543154104e-05, "1": 0}, "score": 4.41403725086717}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7010470821062758, "3": 0.24374748185715137, "5": 0.044508744655632176, "2": 0.01046745875887418, "1": 0.0002196946346781585}, "score": 3.7791651550567322}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6329733555892069, "2": 0.2863917070917789, "4": 0.06484386341940887, "1": 0.014397705865326954, "5": 0.0013900591205141994}, "score": 2.7524360436702224}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.48312974413708554, "3": 0.42214300835329555, "1": 0.06206464970701145, "4": 0.0314079887386018, "5": 0.001226791075950879}, "score": 2.4265865761316197}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.44361338960529995, "2": 0.4103332272481442, "4": 0.11587851745014865, "1": 0.025201506613547527, "5": 0.004972476366937903}, "score": 2.6650869340756893}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6127903855839896, "4": 0.28830348105259784, "2": 0.06279085733147863, "5": 0.03161553074036827, "1": 0.004495321903233976}, "score": 3.279754278857201}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5609997607107973, "2": 0.24362663744674642, "4": 0.17320387675366478, "1": 0.015213394835736591, "5": 0.006947686864888035}, "score": 2.913045071780024}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5942657554056933, "5": 0.246962543401839, "3": 0.15427132132177374, "2": 0.003918066447726908, "1": 0.0005606762015008557}, "score": 4.0831748602529805}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8225123181340369, "4": 0.16473199473147646, "3": 0.012523066690164805, "2": 0.00017663431137841782, "1": 4.3368985158947864e-05}, "score": 4.809516089649776}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6483283033220213, "5": 0.25183924794470325, "3": 0.0980675551039817, "2": 0.0016232861446213765, "1": 0.0001222128941521394}, "score": 4.150161394187774}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5214852962755832, "4": 0.44687603922415425, "3": 0.03128204463100243, "2": 0.00029304511051380034, "1": 4.1530602202722635e-05}, "score": 4.489503360305648}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8748008662094767, "4": 0.11940876165747469, "3": 0.005729445066377528, "2": 4.452113667942504e-05, "1": 1.3267355680161993e-05}, "score": 4.868945304052109}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6038227405683565, "3": 0.28351169626463046, "5": 0.10085194789439757, "2": 0.010661433442574076, "1": 0.0011390580842359438}, "score": 3.792597488594072}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7719412753887321, "5": 0.11934364194100802, "3": 0.10713618465496706, "2": 0.0014433573298672198, "1": 0.00012337747495331033}, "score": 4.008950719070927}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7083329694567352, "4": 0.27624884697639196, "3": 0.015302938656107608, "2": 7.914182989678899e-05, "1": 0}, "score": 4.692896762848697}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7519669691497324, "4": 0.24118437415411303, "3": 0.006815148662897711, "2": 1.871530349627733e-05, "1": 0}, "score": 4.745125412318704}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6629035993809649, "4": 0.3087083496681492, "3": 0.02820712706974459, "2": 0.0001450904814727768, "1": 0}, "score": 4.634429025097092}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9647596751060271, "4": 0.03494979415567219, "3": 0.0002813857652581609, "2": 1.956426427779853e-06, "1": 0}, "score": 4.964481309706768}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9400916955670928, "4": 0.05941782579944927, "3": 0.0004544521183779375, "2": 1.0632683973747321e-06, "1": 0}, "score": 4.939667970754981}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9595374246210815, "4": 0.04015079652726402, "3": 0.0002468052484880815, "2": 5.731427636746696e-07, "1": 0}, "score": 4.959351255749624}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9810868070533344, "4": 0.018807472776725745, "3": 8.908255802015795e-05, "2": 2.4087059448757487e-07, "1": 0}, "score": 4.981013328175903}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9015689965435965, "4": 0.09803472758216672, "3": 0.00037018043834361435, "2": 1.0369093999373882e-06, "1": 0}, "score": 4.901219325514798}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7033950121676666, "5": 0.20400658627445462, "3": 0.09083559997546138, "2": 0.0016992980924080384, "1": 6.132585658252671e-05}, "score": 4.109588651188339}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6824323484406026, "3": 0.23673646939401266, "5": 0.06895470770422468, "2": 0.011478954082929899, "1": 0.00039682372242633775}, "score": 3.8080697252677336}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7350936447954718, "5": 0.15778554153842372, "3": 0.1039566285496215, "2": 0.0030584133823094843, "1": 0.00010503856389975808}, "score": 4.047397005282559}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6407755111604396, "4": 0.3463178790903164, "3": 0.012828735028913294, "2": 7.35304464575846e-05, "1": 2.848166796336743e-06}, "score": 4.62779210998244}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5195499878859029, "5": 0.46687426378308444, "3": 0.01351588254822866, "2": 5.0981792438161163e-05, "1": 7.569390567730794e-06}, "score": 4.453234305299994}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6778236012775599, "5": 0.2871224497592873, "3": 0.034869526409148, "2": 0.00017279148144547557, "1": 1.0093791763394332e-05}, "score": 4.2518774462183195}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5744409339194054, "5": 0.3944804091021129, "3": 0.030926279106210566, "2": 0.00011362670500893816, "1": 0}, "score": 4.363340956472062}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7624060204237416, "5": 0.2022110146184175, "3": 0.03522610682906703, "2": 0.00011500430448467479, "1": 0}, "score": 4.166761878802755}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5290903858493714, "5": 0.4534777833193283, "3": 0.017377986802545712, "2": 4.356532596679227e-05, "1": 6.47182770605611e-06}, "score": 4.435994910159891}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7237726899868718, "5": 0.24256205607537742, "3": 0.0335316671028817, "2": 0.00011877091550384438, "1": 8.368507539960966e-06}, "score": 4.208769087639153}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6883017342275972, "3": 0.29224686669640226, "5": 0.01612979655109323, "2": 0.0032512663902474074, "1": 4.925335848905614e-05}, "score": 3.7172266753520185}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8141834254286807, "3": 0.1357526227381543, "5": 0.048497986372179086, "2": 0.0014871406939621532, "1": 7.612179002367167e-05}, "score": 3.9095424723714127}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6390621614956593, "3": 0.3414643151047651, "5": 0.011515411619201523, "2": 0.00784627015180501, "1": 0.000110530837891471}, "score": 3.6540265101983267}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7953695178403778, "5": 0.17843283911845534, "3": 0.026060834123207453, "2": 0.00012546233047824033, "1": 6.948255062881066e-06}, "score": 4.152100904559441}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8579235723301603, "5": 0.0943351983224299, "3": 0.047575340914152844, "2": 0.0001577099455056544, "1": 6.025060723796021e-06}, "score": 4.046426462311094}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5975782149868122, "4": 0.3697885585757654, "3": 0.03175904221551991, "2": 0.0006858644119448053, "1": 0.0001792630997970053}, "score": 4.563914761860564}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7848765223041057, "5": 0.178683910007562, "3": 0.03588848812333889, "2": 0.0005178850248968878, "1": 2.8989177131418863e-05}, "score": 4.1416732800905995}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4951179311706687, "5": 0.4653225769649171, "3": 0.039028177255292056, "2": 0.00046648159118949214, "1": 4.5963589845242345e-05}, "score": 4.425231569634233}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6354128905837828, "4": 0.3517848893460881, "3": 0.012668876026361558, "2": 0.00010410807663524096, "1": 1.529923088169016e-05}, "score": 4.622498576309981}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7714388897289284, "4": 0.22250813861496857, "3": 0.005993820243160927, "2": 4.544807920272806e-05, "1": 8.706784575096666e-06}, "score": 4.765331876991986}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5181704690660882, "3": 0.2498359691157845, "5": 0.18642454615863593, "2": 0.03815737210295179, "1": 0.007363050220216355}, "score": 3.8381768186480225}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4077964606546381, "1": 0.3006684549133299, "3": 0.19842823118003958, "4": 0.07639562873171522, "5": 0.016663493005903727}, "score": 2.1005463119755863}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5267254415373942, "3": 0.25953731265189695, "5": 0.12455635685468704, "2": 0.06729520452976595, "1": 0.021817322819205072}, "score": 3.6649537623864035}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.6668931105210176, "2": 0.12608320913901414, "3": 0.07624961596743156, "5": 0.07511760702156503, "4": 0.05563537717166603}, "score": 1.7459747259561162}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.31977495379145426, "3": 0.297881179052985, "5": 0.20513782677945466, "2": 0.12591210434745223, "1": 0.051232406894758234}, "score": 3.5017045586603603}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.825836588317322, "3": 0.08996672493146388, "5": 0.08338386946621212, "2": 0.0007399321982132098, "1": 4.156076436746273e-05}, "score": 3.9918123413723605}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5003375041377819, "5": 0.4706748985090015, "3": 0.028712336654102347, "2": 0.00022337513055930395, "1": 3.318827191578218e-05}, "score": 4.441424500222858}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5084409480155682, "4": 0.4759827047355571, "3": 0.015423263384531623, "2": 5.326873416191405e-05, "1": 0}, "score": 4.492960352064428}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5586958782154712, "4": 0.42520694464181075, "3": 0.01598865293340357, "2": 6.577754758335399e-05, "1": 0}, "score": 4.542598864477017}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8037891945627329, "4": 0.1883062786516484, "3": 0.0077494887928917485, "2": 9.944229816071128e-05, "1": 0}, "score": 4.795885068956723}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5931815510066263, "3": 0.20396219927076248, "5": 0.1626289586902385, "2": 0.022011956411542317, "1": 0.018180385242514047}, "score": 3.860096801339031}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.751489155774757, "4": 0.2435896577300135, "3": 0.004888778999635492, "2": 2.2151773432620665e-05, "1": 8.877221003460854e-06}, "score": 4.746530470658364}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6394034542760102, "4": 0.34882790056304813, "3": 0.011627615076379123, "2": 6.620775214427077e-05, "1": 0}, "score": 4.627690388954281}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9398379736807178, "4": 0.05945848149495886, "3": 0.0006940938333783583, "2": 3.2042099610203167e-06, "1": 0}, "score": 4.939143338050163}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7896448749244467, "4": 0.20695760778478473, "3": 0.003316785128439996, "2": 1.4284578916998072e-05, "1": 0}, "score": 4.786351771813122}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"5": 0.725296806230274, "4": 0.26834062947802656, "3": 0.00631303143627191, "2": 2.8220228908576103e-05, "1": 0}, "score": 4.718942656892519}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7792616501353942, "5": 0.1535599092229622, "3": 0.06675552590731254, "2": 0.0003681900179259739, "1": 3.6040761361119834e-05}, "score": 4.085961487096275}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6765255663457712, "5": 0.24815557771750152, "3": 0.07453881370019863, "2": 0.0007021896736841936, "1": 6.849676774594381e-05}, "score": 4.172008503643013}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7647730621113504, "4": 0.23023789005417858, "3": 0.0049558003526281365, "2": 2.259746107072925e-05, "1": 0}, "score": 4.7597801585110515}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8439842294892772, "4": 0.15286128543073332, "3": 0.0031380992397877323, "2": 8.145401687993837e-06, "1": 0}, "score": 4.840836768309803}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8499681931682262, "2": 0.07392117176315968, "3": 0.042607852998842746, "4": 0.017572290869414458, "5": 0.01591799577533916}, "score": 1.275529176324608}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.40340744419526653, "4": 0.38110165058666956, "3": 0.12190825808983831, "1": 0.05372096199022514, "2": 0.03979658398093767}, "score": 4.040745784770611}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9131355671793628, "2": 0.07438902957233114, "3": 0.007236149869597608, "5": 0.0031234088295848247, "4": 0.0021138232590916894}, "score": 1.10769665209331}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5298143430161273, "4": 0.30624957649427287, "3": 0.12070472560355835, "2": 0.021997648889363047, "1": 0.02121222738764902}, "score": 4.301484112930287}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8734086623636091, "5": 0.0777035759612683, "2": 0.0248169001558754, "3": 0.015055197478459431, "4": 0.009005966291530514}, "score": 1.3927633067525254}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8716029250175216, "4": 0.12539205625984545, "3": 0.002944700985413386, "2": 3.1423422614199184e-05, "1": 1.4675310999565806e-05}, "score": 4.868563701364281}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9744619923513516, "4": 0.025255836536788128, "3": 0.0002783136062616435, "2": 1.9040316477800875e-06, "1": 0}, "score": 4.974181773720512}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8885950402754618, "4": 0.1096472702005455, "3": 0.001729928155409183, "2": 1.7883322201957475e-05, "1": 7.617967165788855e-06}, "score": 4.8868084958316}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9612302447489989, "4": 0.03855642986556966, "3": 0.00020925195620258253, "2": 1.448595632745844e-06, "1": 0}, "score": 4.9610206181207355}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8930096374023386, "4": 0.10549428480477337, "3": 0.0014767316172009978, "2": 9.604277363734041e-06, "1": 0}, "score": 4.891522382350812}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5257083698187238, "5": 0.43869820607600113, "3": 0.03520978331181912, "2": 0.00033591866357461246, "1": 2.4001433505601394e-05}, "score": 4.40275413474506}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9008577175433252, "4": 0.0980841299213269, "3": 0.0010326007078668782, "2": 5.098240896440144e-06, "1": 0}, "score": 4.8998333251724935}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9157564719241021, "4": 0.08330041898417173, "3": 0.00092648287124764, "2": 1.945302628379553e-06, "1": 0}, "score": 4.91483952913157}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9575810595663812, "4": 0.04204477319715369, "3": 0.0003279343900251528, "2": 5.658153775660324e-07, "1": 0}, "score": 4.957295710398544}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9732082294848138, "4": 0.026712392037291848, "3": 7.743559495057843e-05, "2": 1.4217829050123766e-07, "1": 0}, "score": 4.973132261857075}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5762681029886726, "5": 0.41446909785859143, "3": 0.009219695204871788, "2": 1.0729366962855839e-05, "1": 0}, "score": 4.405241063429386}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8999065899398454, "4": 0.09935930058724846, "3": 0.000577223741338713, "2": 1.280378270324829e-06, "1": 0}, "score": 4.899466767286068}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8508534792728913, "4": 0.14640252944125223, "3": 0.0026679577150130213, "2": 8.136308353880916e-06, "1": 0}, "score": 4.848226841221659}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.916177028890496, "4": 0.08274092817829574, "3": 0.0010448593457425006, "2": 2.976468581282425e-06, "1": 0}, "score": 4.915157521507898}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8097270203747048, "4": 0.18883961916752104, "3": 0.001385922910349146, "2": 3.4981580479951737e-06, "1": 0}, "score": 4.808369620415771}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7568432305924946, "3": 0.218865279621674, "5": 0.02360572527438662, "2": 0.0006679514945588021, "1": 1.6859976486901324e-05}, "score": 3.8033537753223374}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7429357587358069, "5": 0.2333260843875333, "3": 0.023691536602455186, "2": 3.944181539516425e-05, "1": 0}, "score": 4.20955716845179}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9051049003595364, "5": 0.06392202485941272, "3": 0.0309496063139088, "2": 2.1589790868129767e-05, "1": 8.903964713385036e-07}, "score": 4.032926600315049}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8064089443682864, "5": 0.16203999362334487, "3": 0.03151611426457562, "2": 3.0909561137379453e-05, "1": 0}, "score": 4.130462587068251}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9020595420105314, "5": 0.054565077887068776, "3": 0.04332157067518742, "2": 4.800329037147775e-05, "1": 0}, "score": 4.011147565355429}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5416158460310189, "4": 0.4088486951058539, "3": 0.04873492305689982, "2": 0.000650288920991262, "1": 7.826116930563935e-05}, "score": 4.49138093403255}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4998133251361534, "4": 0.45288753111904867, "3": 0.04647924547018497, "2": 0.0007205652388424447, "1": 8.914948414884681e-05}, "score": 4.451630099934273}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5364697191375382, "5": 0.4369944867931987, "3": 0.026356527808710842, "2": 0.00014653928623946236, "1": 2.076939601876567e-05}, "score": 4.4102874782685975}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8809493466397095, "4": 0.11402107263436487, "3": 0.004974989594159497, "2": 3.078974124278524e-05, "1": 0}, "score": 4.875933626001369}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6612593738205571, "4": 0.31845066943507216, "3": 0.020133825855241667, "2": 0.00011051956432096793, "1": 0}, "score": 4.640933742673791}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8148332890321064, "5": 0.1632450880161778, "3": 0.021744826756808097, "2": 0.00015238886220907662, "1": 1.6751864373611274e-05}, "score": 4.1411463084829245}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5985502485687436, "4": 0.39981857390639164, "3": 0.001599945040522184, "2": 2.016831182132479e-06, "1": 0}, "score": 4.596963710550574}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7298457270367489, "5": 0.2563182352690562, "3": 0.013729035627716525, "2": 4.059035829411697e-05, "1": 0}, "score": 4.2425241253661925}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5117455961239966, "4": 0.4847180486886316, "3": 0.003481474736871253, "2": 9.802706862182884e-06, "1": 0}, "score": 4.508267427522199}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8771750198386566, "5": 0.0918499969984341, "3": 0.03041302829624825, "2": 5.4387457029403715e-05, "1": 0}, "score": 4.061359337788264}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8377077385595457, "4": 0.1564494225233464, "3": 0.005709767352583792, "2": 9.181921210910889e-05, "1": 3.228234731141918e-05}, "score": 4.831724946317824}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8302982710798605, "4": 0.16678368593264958, "3": 0.002626947639890051, "2": 7.638853740561375e-06, "1": 0}, "score": 4.827890716732352}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8749218420373321, "4": 0.1237381425378652, "3": 0.00130186842027403, "2": 6.539250509867811e-06, "1": 0}, "score": 4.873634508740693}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9707877885095073, "4": 0.028686788305270085, "3": 0.0004038504184194966, "2": 3.659211027666771e-06, "1": 0}, "score": 4.970491053720025}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9816040015844197, "4": 0.017728690845561744, "3": 0.0006028798709935393, "1": 3.276004255459293e-05, "2": 2.4498834817841037e-05}, "score": 4.98086087553281}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7100179695796055, "5": 0.2640391213190022, "3": 0.025851258357642952, "2": 7.260193380904831e-05, "1": 9.728751349113216e-06}, "score": 4.238015691159882}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7529312325405025, "4": 0.24042555018525452, "3": 0.006618101716018275, "2": 1.5652874245213964e-05, "1": 4.518032258266772e-06}, "score": 4.746271961034156}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6549390179811697, "4": 0.32872659235076596, "3": 0.016250558525452114, "2": 7.007131842022236e-05, "1": 8.91295251893275e-06}, "score": 4.638524672808471}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8627220533953615, "4": 0.13407894643680002, "3": 0.0031727692246198273, "2": 1.1352075128993959e-05, "1": 0}, "score": 4.859539368993373}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8413260171213433, "4": 0.1538353045212749, "3": 0.004796359914057839, "2": 1.7950313105118986e-05, "1": 0}, "score": 4.83651414086659}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9695330249312638, "4": 0.02891607529285362, "3": 0.0015136197672405338, "2": 2.169063407575985e-05, "1": 1.2771275632445257e-05}, "score": 4.96794043782089}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7836357744382458, "4": 0.20598055661730955, "3": 0.010207587119042093, "2": 0.00013847441204264445, "1": 3.578710231504883e-05}, "score": 4.773045284371043}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9637367467019353, "4": 0.034929791124931955, "3": 0.0012894970762463017, "2": 2.604486317990899e-05, "1": 1.4745118191926478e-05}, "score": 4.962353980129806}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990879989959398, "4": 0.0008942304875215212, "3": 1.3860132560480806e-05, "1": 0, "2": 0}, "score": 4.999078045642162}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.659854534847442, "4": 0.27344458278748907, "3": 0.06299495091554629, "2": 0.002623546632700644, "1": 0.0010726961858727082}, "score": 4.588400102900325}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5327018991104123, "5": 0.45157942860126515, "3": 0.015586587658776468, "2": 4.2652784454623144e-05, "1": 0}, "score": 4.435946522875481}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6443869173173572, "5": 0.34104665257023214, "3": 0.014419901181885913, "2": 5.665292154360519e-05, "1": 0}, "score": 4.326542793908337}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8513451763628825, "5": 0.11919864403033836, "3": 0.02919940928144594, "2": 0.00014914419027372842, "1": 0}, "score": 4.089710601573667}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6479610645539268, "4": 0.3451602420753001, "3": 0.00663650373567374, "2": 2.7260439753576886e-05, "1": 0}, "score": 4.641407897221985}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5694846214836866, "4": 0.4250170258655574, "3": 0.005438244349902984, "2": 9.966361354826027e-06, "1": 0}, "score": 4.564054727209078}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7221386879229569, "4": 0.27537992205808354, "3": 0.0024736709922779684, "2": 3.265254011325455e-06, "1": 0}, "score": 4.71966169163223}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9966694595952095, "4": 0.0033136930051865373, "3": 1.6741029422846075e-05, "1": 3.6708775354184404e-08, "2": 0}, "score": 4.996652677867687}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9575856540513271, "4": 0.041999288555374, "3": 0.00041292317469265817, "2": 5.947777681954617e-07, "1": 0}, "score": 4.957173014832326}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.92121082051155, "4": 0.07852434302784521, "3": 0.000260991426458271, "2": 5.437669949236206e-07, "1": 0}, "score": 4.920951781858968}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8994837557087801, "4": 0.09987298003813491, "3": 0.0006405301917214664, "2": 1.2623581986575931e-06, "1": 0}, "score": 4.898842023629312}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5518113435789771, "3": 0.37430546634397277, "5": 0.04884524226580416, "2": 0.022256515094396762, "1": 0.002748684075032538}, "score": 3.6217683069337006}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8448560171913806, "4": 0.14399024856467385, "3": 0.010777334581118497, "2": 0.00012687921335630177, "1": 0}, "score": 4.834033032480687}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.49840350950038864, "5": 0.4494754692385611, "3": 0.05144891013086548, "2": 0.0005419653437443811, "1": 0}, "score": 4.396994295555014}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5476159274885798, "5": 0.41248955283035027, "3": 0.03952778249535487, "2": 0.0002467906874079768, "1": 0}, "score": 4.37251287057458}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5981327258958947, "4": 0.37391514213455534, "3": 0.027323763432906975, "2": 0.0002956654438873044, "1": 0}, "score": 4.570407407883947}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7402845571574154, "5": 0.13215630871827388, "3": 0.12530315973997788, "2": 0.002161810962477053, "1": 9.157822801148435e-05}, "score": 4.002254798198399}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7540645383564435, "5": 0.16131945296109226, "3": 0.08376201130443517, "2": 0.0007439929492430094, "1": 8.224812211565838e-05}, "score": 4.07582481600867}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7625216175631179, "5": 0.15398124033425684, "3": 0.08250704461617414, "2": 0.0008761236710453565, "1": 0}, "score": 4.069729895758259}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6535925394837737, "5": 0.3076888604321252, "3": 0.03843722069166926, "2": 0.00025009492804361274, "1": 0}, "score": 4.268759857892572}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5379526144122696, "5": 0.4362659519759684, "3": 0.025633338232854495, "2": 0.00012621661000455337, "1": 0}, "score": 4.4103891593326825}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7287084488196888, "3": 0.18541676571067628, "5": 0.07597828524364757, "2": 0.008998338768148305, "1": 0.0008938975380870008}, "score": 3.8698825945722386}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5479058025315782, "4": 0.36251957722781153, "3": 0.0860212431378982, "2": 0.003168286732910095, "1": 0.00038256269868502826}, "score": 4.454401446409216}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5597327731210499, "5": 0.3712387842856364, "3": 0.06780492815672336, "2": 0.0010728174073905983, "1": 0.00014916223781260562}, "score": 4.300841196329172}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6685582639451186, "3": 0.2707770744857141, "5": 0.042731838682667035, "2": 0.017415577755067576, "1": 0.0005142093909884782}, "score": 3.735580177803904}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5498443724378712, "3": 0.3935801448780816, "2": 0.03542836175838788, "5": 0.019221842814295523, "1": 0.0019231996415605295}, "score": 3.549014438134885}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9663801201983296, "4": 0.030235214223503126, "3": 0.003144359708057018, "1": 0.0001432202360819631, "2": 8.589490876975478e-05}, "score": 4.96264508266113}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9390940077831382, "4": 0.059741616956322234, "3": 0.001151522844493721, "2": 7.679055501062822e-06, "1": 3.43614621811307e-06}, "score": 4.937918447754353}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9849417121925688, "4": 0.014597126276765657, "3": 0.0004448881747829056, "2": 2.1168127931009087e-06, "1": 0}, "score": 4.98450652760128}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8437221033822949, "4": 0.14389576437861834, "3": 0.011387215502764034, "2": 0.0005687772936587459, "1": 0.0004199495386400919}, "score": 4.829942621941468}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8996521773208189, "4": 0.09283408605531492, "3": 0.0072859022254195905, "2": 0.00013310969436719158, "1": 9.115788999739147e-05}, "score": 4.891829763027631}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"5": 0.40704247003629207, "4": 0.34792553569226126, "3": 0.20282551531833665, "2": 0.022695014594562496, "1": 0.019347017611307138}, "score": 4.100802449329814}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6852477001672899, "4": 0.24539932434241712, "3": 0.06575695723907933, "2": 0.0021883181461239925, "1": 0.0009676733267596889}, "score": 4.6124805945184795}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5378351706602398, "3": 0.29068536984917154, "5": 0.14818295295951872, "2": 0.020595301741493263, "1": 0.0026765275898543877}, "score": 3.8082726655640733}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5509597398068291, "4": 0.2777944853530108, "3": 0.14646170265854275, "2": 0.012903173372484618, "1": 0.011857701581733627}, "score": 4.3431265452426135}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4956646647672648, "5": 0.3065056775377835, "3": 0.17581211193513382, "2": 0.013413957629326713, "1": 0.006728001051663787}, "score": 4.0838388943359245}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"4": 0.57694846031951, "5": 0.2137066283624027, "3": 0.20095877328407896, "2": 0.007180590190975305, "1": 0.001183167635861521}, "score": 3.994837056241037}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5308533887037642, "4": 0.4285506263850992, "3": 0.03972313561282187, "2": 0.0006372006244106703, "1": 0.00021924494123996325}, "score": 4.48920614182517}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.65083942902549, "5": 0.2532384104950534, "3": 0.09325436610993913, "2": 0.0022051787667799593, "1": 0.00042011826625643626}, "score": 4.154319890237086}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6616263820063802, "5": 0.25497950744851133, "3": 0.08156508406043242, "2": 0.0015588405051644143, "1": 0.0002592903711820988}, "score": 4.169520718295554}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4890496308875172, "4": 0.4721515804176198, "3": 0.03840276948438227, "2": 0.00034238925349839287, "1": 4.8408555177314604e-05}, "score": 4.44981920591742}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8241834420521341, "3": 0.1167113717658011, "5": 0.05529188092217264, "2": 0.0036254988005130465, "1": 0.0001830844566203424}, "score": 3.9307799313281295}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7562066149075672, "5": 0.2271497017015289, "3": 0.016572907420840995, "2": 5.607379314205224e-05, "1": 0}, "score": 4.210467741028368}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8576360359647044, "3": 0.11234298737127746, "5": 0.028662942288663378, "2": 0.0013157605704232152, "1": 4.027168264062645e-05}, "score": 3.9135674456800733}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.883054918460695, "3": 0.06438716287375537, "5": 0.052246049429526445, "2": 0.0002853893984207168, "1": 0}, "score": 3.9872877711411743}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8173564892002891, "3": 0.15682756332546866, "5": 0.02314270191972352, "2": 0.0026179518593350327, "1": 5.3088352715520586e-05}, "score": 3.8609196630976643}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5228812166127449, "3": 0.30865380572186246, "5": 0.13344338146204326, "2": 0.027091750690524993, "1": 0.007901734394482123}, "score": 3.7468937560761084}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5168153628906449, "5": 0.44498086399453163, "3": 0.037602580523392264, "2": 0.0004931254272259991, "1": 0.00010249126320941556}, "score": 4.406086823126981}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6216397711959452, "5": 0.2602177496029202, "3": 0.11478756727037275, "2": 0.0029621971665723407, "1": 0.0003688819071388113}, "score": 4.138402440803573}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5037850197617747, "5": 0.4612985184997695, "3": 0.034617324989435025, "2": 0.0002488104988598025, "1": 3.9111578871157536e-05}, "score": 4.426071016022392}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7158441953217314, "5": 0.1545896796858162, "3": 0.12662422966817596, "2": 0.0025592137412235793, "1": 0.00036280200981717747}, "score": 4.02175904906635}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7085016152765595, "5": 0.19985577451431066, "3": 0.08992994505779707, "2": 0.0016466280304749574, "1": 5.8716721968699646e-05}, "score": 4.106457202538846}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6012967535519499, "5": 0.3525347429593074, "3": 0.04550577672932694, "2": 0.0005393375126510481, "1": 0.00011123827897461169}, "score": 4.3056202899500535}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7107807252856665, "5": 0.2488240895136695, "3": 0.04019077448970248, "2": 0.0001730378848272487, "1": 1.7076573576567607e-05}, "score": 4.208238986570726}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7959355211493022, "4": 0.20185370028416746, "3": 0.0020888554386978408, "2": 3.6042386583600076e-06, "1": 0}, "score": 4.793933394550609}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6891138376934698, "5": 0.23959475587009596, "3": 0.07052320319357433, "2": 0.0006694134344486184, "1": 8.370147149817707e-05}, "score": 4.16748414845039}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5780563637070176, "2": 0.3233992341376817, "4": 0.07945096818355242, "1": 0.015790765055316913, "5": 0.0033013493504775544}, "score": 2.731072547768682}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5602465916180595, "4": 0.3687005802391461, "2": 0.03549952723192528, "5": 0.033500832155397786, "1": 0.0020515862593507117}, "score": 3.3960998943559346}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5346730876368734, "3": 0.34177522323522674, "5": 0.10545822247400535, "2": 0.017159788674568268, "1": 0.000923413525961969}, "score": 3.72659037491141}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5455150416656421, "5": 0.31347928426248894, "3": 0.1390344965532622, "2": 0.0017726859442191026, "1": 0.00019132959286308174}, "score": 4.170326646918498}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6584809418363046, "3": 0.21733124818726382, "5": 0.12013210100183719, "2": 0.0037566337569027485, "1": 0.00028820226941068456}, "score": 3.89442183054656}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8069231616930385, "4": 0.1884371216293053, "3": 0.004622414922297532, "2": 1.2609967314764061e-05, "1": 0}, "score": 4.802279290960497}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8759130333252553, "4": 0.12256266852668753, "3": 0.0015112736603685182, "2": 2.8007004817986048e-06, "1": 0}, "score": 4.874405097995577}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9794307690335263, "4": 0.020287310234481732, "3": 0.00027145898449568027, "2": 9.515638955702881e-07, "1": 0}, "score": 4.979166718976513}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9721368969064955, "4": 0.02765050741018711, "3": 0.00021140686734078857, "2": 2.551561822156007e-07, "1": 0}, "score": 4.971925887174915}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9627997362633325, "4": 0.03696618511590195, "3": 0.00023072985284672943, "2": 1.7376257170192884e-07, "1": 0}, "score": 4.9625717150556845}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5634833462866468, "5": 0.42329197069116353, "3": 0.013122876159725539, "2": 7.603711360254488e-05, "1": 1.450495852142942e-05}, "score": 4.409978123746278}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8621358776986245, "4": 0.13644873536376234, "3": 0.001353102736910933, "2": 3.1115081923946914e-06, "1": 0}, "score": 4.860827489425664}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6538252925408611, "4": 0.3366310350167294, "3": 0.00950202828005989, "2": 1.7647542842478036e-05, "1": 0}, "score": 4.64430343027938}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6422909852018849, "4": 0.3526035291975382, "3": 0.0050734967744987276, "2": 1.4724261242114518e-05, "1": 0}, "score": 4.637199040869056}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.982170950270481, "4": 0.017675430695498567, "3": 0.00013579841696685513, "2": 4.502226944668876e-07, "1": 0}, "score": 4.9820513100266615}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7679944825806881, "3": 0.1981021841195391, "5": 0.032712261563574076, "2": 0.0011055981259552687, "1": 7.688229054319718e-05}, "score": 3.8321667924117526}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7313554029770828, "5": 0.18202446097041358, "3": 0.08628192039512221, "2": 0.00028911587461094964, "1": 3.0685847596556955e-05}, "score": 4.095074001969789}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.68050880361101, "4": 0.30729268937254384, "3": 0.01207236889597651, "2": 3.828463183020814e-05, "1": 0}, "score": 4.668418588356231}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6649860207339124, "4": 0.32026125320795285, "3": 0.014652387317047882, "2": 6.860398050922485e-05, "1": 2.675615547175796e-05}, "score": 4.650119393677164}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5869344117879312, "4": 0.396027747792253, "3": 0.016999633397693573, "2": 2.508518813890936e-05, "1": 0}, "score": 4.569892086043301}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7166299646186134, "4": 0.2645693683171097, "3": 0.018593195472661563, "2": 0.00013662399054548623, "1": 0}, "score": 4.697812959539039}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9238462142376506, "4": 0.07352572014723305, "3": 0.002594705386560493, "2": 1.1892138576243016e-05, "1": 0}, "score": 4.921247501998205}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8884190625694323, "4": 0.10585386162676202, "3": 0.005623632340058615, "2": 2.7029789104002808e-05, "1": 0}, "score": 4.882808829317821}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9527651814568386, "4": 0.046321169396390915, "3": 0.000865476790498905, "2": 7.033036576184932e-06, "1": 0}, "score": 4.9519248001318665}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9363899743610137, "4": 0.06248464077754128, "3": 0.0010352467239965165, "2": 5.078944975149363e-06, "1": 0}, "score": 4.93542413616871}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7608192619887618, "4": 0.2338129598801261, "3": 0.00531797865444868, "2": 4.255777472051565e-05, "1": 4.4251472642573105e-06}, "score": 4.755405019982621}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9039289832749479, "4": 0.09543527595072832, "3": 0.0006254757486199857, "2": 1.632243678111582e-06, "1": 0}, "score": 4.903308041100392}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9593496653577004, "4": 0.040261334994233254, "3": 0.0003793317143216785, "2": 2.0968528084413377e-06, "1": 0}, "score": 4.958973400402993}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8363371899125971, "4": 0.15881540913841694, "3": 0.004774490558788978, "2": 3.3056048427969497e-05, "1": 0}, "score": 4.831529727326895}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8629267067091067, "4": 0.13114309810718838, "3": 0.005813045284974766, "2": 6.63801826562682e-05, "1": 0}, "score": 4.857024411944882}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6174094505610811, "3": 0.3256611354631363, "2": 0.03506396198593303, "5": 0.020616342344553236, "1": 0.001247696784116409}, "score": 3.621083657201011}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5471322677673839, "4": 0.4461970537438562, "3": 0.006649680304375446, "2": 1.3819872022206605e-05, "1": 0}, "score": 4.540458827301245}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7379642775182599, "4": 0.26015403007881666, "3": 0.0018749899117016956, "2": 3.7288227155007156e-06, "1": 0}, "score": 4.736084018830993}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9166405301131116, "4": 0.08250598028216358, "3": 0.000835963588712277, "2": 1.1670317482698996e-06, "1": 0}, "score": 4.9158172143003}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9047996328143433, "4": 0.09356524299352197, "3": 0.0016249396538212475, "2": 6.218461680804556e-06, "1": 2.3640270878610685e-06}, "score": 4.903156611057534}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4937714108303232, "2": 0.3935682982940127, "4": 0.08907916591160672, "1": 0.020397804632029032, "5": 0.0031772666367666613}, "score": 2.6610677398344524}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6417743607987776, "3": 0.3011288297462869, "5": 0.04539745648789366, "2": 0.011182905067201189, "1": 0.0005127800280380197}, "score": 3.7203634508520773}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5488947489328099, "3": 0.4058814731730544, "5": 0.02253750203857785, "2": 0.021798894968286353, "1": 0.0008778679274154634}, "score": 3.570420548574628}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6514240085320268, "3": 0.2572325601391181, "5": 0.08594348928942987, "2": 0.005103279023850253, "1": 0.00028777662108809095}, "score": 3.8176394207113002}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7350495257989355, "5": 0.17116893263420505, "3": 0.0923503299059009, "2": 0.0013492431140736763, "1": 7.553994264098615e-05}, "score": 4.075893984564624}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.797066393018199, "4": 0.19057922339991631, "3": 0.011430448078217569, "2": 0.0005136933838388601, "1": 0.00021345532452549592}, "score": 4.784122497152067}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7029330826266225, "4": 0.26531239453205957, "3": 0.02773806281965098, "1": 0.0020045988761684505, "2": 0.0019770619498576487}, "score": 4.665250249452331}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.638342510101957, "4": 0.31826226608295105, "3": 0.03763917811190632, "2": 0.0030986885666968124, "1": 0.002440832766890416}, "score": 4.5873106236185235}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5519223019219854, "4": 0.42339149833248885, "3": 0.023927884132637176, "2": 0.0005855148572079667, "1": 0.00015448014209756887}, "score": 4.526369591062519}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5475159693249758, "4": 0.36997918562270987, "3": 0.0666570341027782, "2": 0.00869454031772591, "1": 0.007141765244960409}, "score": 4.442049644804035}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5872017391021466, "4": 0.3526422471906229, "2": 0.0373354761920879, "5": 0.02128853742887382, "1": 0.0015265209830916439}, "score": 3.354832748055337}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5898705930223409, "5": 0.34035326025827606, "3": 0.06910582179644276, "2": 0.0005919289187312143, "1": 6.137426177670827e-05}, "score": 4.269884051735857}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5306147865840009, "4": 0.46165902569819917, "3": 0.007335974647033025, "2": 7.029366289120427e-06, "1": 0}, "score": 4.52346533659123}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6601609104267887, "4": 0.32558764203890717, "3": 0.014159654368764861, "2": 4.783294164846819e-05, "1": 0}, "score": 4.645933985577352}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6307082403464449, "5": 0.2531211123136929, "3": 0.11468273377063551, "2": 0.0013646435772630805, "1": 9.940749944648515e-05}, "score": 4.135414100208145}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6289164128895782, "5": 0.26007456516151173, "3": 0.1033377013433266, "2": 0.006671216846078793, "1": 0.0009693329533343599}, "score": 4.140490754279793}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.542154344300024, "4": 0.42149317240450407, "3": 0.035269891888240104, "2": 0.0006439251920630227, "1": 0}, "score": 4.505818487509136}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9373720916678888, "4": 0.061688817769399086, "3": 0.000907323954659101, "2": 7.5877762020051325e-06, "1": 0}, "score": 4.936472234965528}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5028925449671988, "4": 0.4849941742366466, "3": 0.011990298673933105, "2": 5.386557321380986e-05, "1": 0}, "score": 4.490828439514732}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5483951364231842, "4": 0.4362407801567533, "3": 0.015231515644314467, "2": 0.00010644070376814999, "1": 0}, "score": 4.532964664177478}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9191708043254928, "4": 0.08038613242098987, "3": 0.000418819717135881, "2": 6.478588424818047e-07, "1": 0}, "score": 4.918772367947197}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8912517265789713, "4": 0.10848550601935204, "3": 0.0002447571655413976, "2": 3.781609266676299e-07, "1": 0}, "score": 4.891021923657147}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9409811730336906, "4": 0.058646991559878896, "3": 0.00031261598676555634, "2": 6.889128924344649e-07, "1": 0}, "score": 4.940722240170589}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9714001214934841, "4": 0.028443176187244977, "3": 7.75884486079925e-05, "1": 0, "2": 0}, "score": 4.9713993842101205}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.93531009712459, "4": 0.06440285593746985, "3": 0.00026194316636636453, "2": 6.304361219479434e-07, "1": 0}, "score": 4.935069777362313}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9316145991918612, "4": 0.0674787260776439, "3": 0.0008983843271354833, "2": 6.018153940943015e-06, "1": 1.691279863445271e-06}, "score": 4.930699645425411}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9049711321208275, "4": 0.09234569403570095, "3": 0.002654502564090422, "2": 1.3758881707761858e-05, "1": 0}, "score": 4.902302567288027}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8870427035784825, "4": 0.10907893331241364, "3": 0.0037608604675850787, "2": 3.4878080220085356e-05, "1": 0}, "score": 4.883285067991703}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8778030299320706, "4": 0.11870894763062545, "3": 0.0034336436259777233, "2": 3.415293606821419e-05, "1": 1.2168219062564507e-05}, "score": 4.8742716203569065}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9403598912119355, "4": 0.05876475550269211, "3": 0.0008179830032503145, "2": 2.3338331812110217e-06, "1": 0}, "score": 4.9395889521817145}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.600569023912631, "4": 0.3791745977124786, "3": 0.019768953044101013, "2": 0.00032914801985614166, "1": 8.988630176587334e-05}, "score": 4.579911776675155}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5534830005233673, "4": 0.4197285861707674, "3": 0.025697938610656886, "2": 0.0007160379425638963, "1": 0.0003478426276042169}, "score": 4.525323428661719}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7153300889174602, "4": 0.2656930722860055, "3": 0.01768648482993175, "2": 0.0008956933919825099, "1": 0.0003924077814763053}, "score": 4.694676558921724}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6529573015338739, "4": 0.33036786597833334, "3": 0.016059795564945342, "2": 0.00039082565209240294, "1": 0.00016090587359532334}, "score": 4.6356733785996544}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8782825729961704, "4": 0.11763657264338952, "3": 0.0038503008148786924, "2": 0.00012613926293192045, "1": 0.00010192380842818432}, "score": 4.873876398596768}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5122818382812813, "4": 0.4349520864725885, "3": 0.05169280372996399, "2": 0.0008763897902124037, "1": 0.00018127560595015494}, "score": 4.458299580431292}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8421032732037484, "4": 0.15370747437258916, "3": 0.004101418867068275, "2": 9.090942225283603e-06, "1": 0}, "score": 4.838049662673641}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.735034060519608, "4": 0.25448748984883524, "3": 0.010381380644728513, "2": 5.6618373799596784e-05, "1": 0}, "score": 4.724568752377496}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9409174331279243, "4": 0.058512738284212606, "3": 0.0005541201596833303, "2": 1.400641796943671e-06, "1": 0}, "score": 4.940373966354477}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7552106515298342, "4": 0.23798410339484793, "3": 0.006765710479741945, "2": 1.4922938980200761e-05, "1": 0}, "score": 4.748433515360796}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6606847908255771, "5": 0.26061491047087876, "3": 0.07763147720152032, "2": 0.0008385410679694763, "1": 0.00011512431654966473}, "score": 4.1809818193474255}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6252058646753532, "4": 0.35642184206785715, "3": 0.018144340229259107, "2": 0.00010797271517788754, "1": 0}, "score": 4.606918397274615}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7167406638320286, "5": 0.2498493606826199, "3": 0.033140456240981005, "2": 0.00019734363672065653, "1": 0}, "score": 4.216329830905196}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8711537556343795, "4": 0.12594377522414144, "3": 0.0027092582230228766, "2": 4.528761750930999e-06, "1": 0}, "score": 4.868599329082578}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5672535199799312, "5": 0.421563103922465, "3": 0.010900894814969787, "2": 1.863078943225032e-05, "1": 0}, "score": 4.410733319717612}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8857616700426568, "4": 0.11346617546497315, "3": 0.000769952294677591, "2": 1.442587762298436e-06, "1": 0}, "score": 4.884989504819272}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7204254058440887, "5": 0.2632663293690233, "3": 0.016240411595813124, "2": 5.68260051423131e-05, "1": 5.581047919553399e-06}, "score": 4.2468968672535805}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9250944579320205, "4": 0.07463714301782864, "3": 0.00026722835578031536, "2": 3.958098174570657e-07, "1": 0}, "score": 4.924827154590882}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8543529672377613, "4": 0.14466872580153148, "3": 0.0009688500550478133, "2": 7.808669969567406e-07, "1": 0}, "score": 4.853389959493002}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7257918596203092, "4": 0.2730303821671195, "3": 0.0011694356464545187, "2": 1.4631849874544426e-06, "1": 0}, "score": 4.724624468079282}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7869478162046036, "4": 0.20674777643190323, "3": 0.006264939797611926, "2": 3.102184264942296e-05, "1": 5.5454155421325566e-06}, "score": 4.780606460473987}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.677515417520082, "4": 0.31920530304340017, "3": 0.003252873237909853, "2": 7.29069266997506e-06, "1": 0}, "score": 4.674260851734147}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6847248364743427, "4": 0.3091446155744029, "3": 0.0060942681322617214, "2": 2.1572827959803693e-05, "1": 0}, "score": 4.67859740281208}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7713138264802629, "4": 0.2246244235856783, "3": 0.004038746126136111, "2": 1.5953281710857605e-05, "1": 0}, "score": 4.7672485832969524}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6760167669948155, "4": 0.3174439537035155, "3": 0.006482314217787025, "2": 3.6592363019464076e-05, "1": 0}, "score": 4.6694749070763955}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.787078137683158, "4": 0.20648485720423004, "3": 0.006349848656395921, "2": 6.188745898572734e-05, "1": 1.4668136526788577e-05}, "score": 4.780568784400164}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9272386204984591, "4": 0.07190715543097208, "3": 0.0008337677263257766, "2": 4.445220873085349e-06, "1": 0}, "score": 4.926410795207921}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6069876282051236, "4": 0.3883498384916689, "3": 0.00462548753777683, "2": 2.2593913547828983e-05, "1": 0}, "score": 4.602325657561439}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9809846979092011, "4": 0.01887321231727559, "3": 0.0001333913859041317, "2": 8.255120305830951e-07, "1": 0}, "score": 4.98085737766734}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.984698692051805, "4": 0.015164046725330518, "3": 0.00010611724396087438, "2": 6.569223593173413e-07, "1": 0}, "score": 4.984621279167738}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5133399924610453, "3": 0.26008452620811023, "5": 0.20788494528327436, "2": 0.015320286711422526, "1": 0.003353143550025721}, "score": 3.9070988258546264}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5902130237762343, "5": 0.32037464576088615, "3": 0.08750507388872958, "2": 0.0016647896497788716, "1": 0.00023985859398334612}, "score": 4.2288210136314515}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6393073208001211, "4": 0.2939729566670308, "3": 0.06534000475735416, "2": 0.0010965383673228262, "1": 0.0002625985809385329}, "score": 4.570998195180511}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8863347216933595, "4": 0.10913957623465563, "3": 0.004376069202009284, "2": 8.83333351570776e-05, "1": 5.814300375473279e-05}, "score": 4.881610339640194}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5121285045423125, "4": 0.4628284277441176, "3": 0.024764997844007142, "2": 0.0002194208462113027, "1": 4.394942574571591e-05}, "score": 4.486799972492356}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.56472002591778, "4": 0.40345482314755043, "2": 0.020723548844044176, "5": 0.010366431848413946, "1": 0.0007160031439655009}, "score": 3.4020398376494705}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.779405967169668, "3": 0.15294987892256803, "5": 0.06411679736554361, "2": 0.0033810113441408805, "1": 0.00014376205800942511}, "score": 3.9039733615304075}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7055291713978596, "3": 0.2584204679184328, "5": 0.030580895349062904, "2": 0.005349205145749035, "1": 0.00011641967590122129}, "score": 3.761111840658348}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7036506160736813, "3": 0.25766355383065753, "5": 0.02978840664274735, "2": 0.008651046350312686, "1": 0.00024326674515181307}, "score": 3.7540921950148354}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8028422782149502, "5": 0.11035296252669712, "3": 0.08534185200240493, "2": 0.0014004028972678195, "1": 5.9259467599816956e-05}, "score": 4.0220325978203375}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9833683507679288, "4": 0.016536801297795684, "3": 8.339201471551151e-05, "1": 0, "2": 0}, "score": 4.9832962233156515}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9974371444362683, "4": 0.002534759799695979, "3": 7.238431635240565e-06, "1": 0, "2": 0}, "score": 4.997450710165649}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9866348603337133, "4": 0.013171432489598584, "3": 4.0146270943680474e-05, "1": 0, "2": 0}, "score": 4.9867462397090785}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9985069623913015, "4": 0.001461694792073075, "3": 5.6095783594362275e-06, "1": 0, "2": 0}, "score": 4.998527048147386}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.998277043895984, "4": 0.00170926350512881, "3": 4.125666398805701e-06, "1": 0, "2": 0}, "score": 4.998282468730568}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7742066123454733, "5": 0.11645110426003626, "3": 0.10667988048308372, "2": 0.0023095963730429187, "1": 0.0003496219954902466}, "score": 4.0041031781111425}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5014867162333774, "3": 0.3788396312465052, "5": 0.08044972691645774, "2": 0.035989091511980785, "1": 0.003214419491870844}, "score": 3.6199808962324553}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6327921549287865, "5": 0.2042926406660468, "3": 0.15867233329697394, "2": 0.0037446339891253886, "1": 0.00047141959530896244}, "score": 4.036717765284438}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5629603047437535, "5": 0.41083960340998515, "3": 0.02600419780381665, "2": 0.00015355803257603576, "1": 2.6557244100924115e-05}, "score": 4.38445468402912}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4751344083629035, "3": 0.45084634318681055, "2": 0.04830658462382261, "5": 0.02340092330308755, "1": 0.0023078613633801125}, "score": 3.4690157670056965}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5631947702269745, "5": 0.3966350859366076, "3": 0.03969269949550676, "2": 0.00041785377801488644, "1": 4.255611499966635e-05}, "score": 4.3559850745492765}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7086594445031347, "4": 0.2885259641585832, "3": 0.0027901358292915994, "2": 9.944330183629944e-06, "1": 0}, "score": 4.705859662869257}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.923585611811133, "4": 0.07479162989966852, "3": 0.0016071369097401455, "2": 1.0699869637305771e-05, "1": 0}, "score": 4.921961612605249}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9535681433032415, "4": 0.04618157823104419, "3": 0.0002407383256621765, "2": 3.812799327406812e-07, "1": 0}, "score": 4.953335373883049}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8871796682226464, "4": 0.1113069031180469, "3": 0.001498294226934129, "2": 5.333355330139245e-06, "1": 0}, "score": 4.885679387896967}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6211016641880536, "4": 0.36688743301733423, "3": 0.011946076271535466, "2": 3.935706722957743e-05, "1": 0}, "score": 4.6090923870337175}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9561259937395762, "4": 0.04358100014919, "3": 0.0002915358719156546, "2": 4.171887832364068e-07, "1": 0}, "score": 4.955834630032263}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5102628979013476, "5": 0.4803947102372621, "3": 0.009323038351801738, "2": 1.1319179162103986e-05, "1": 0}, "score": 4.471052818121126}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9069454899104449, "4": 0.09214311617906155, "3": 0.0008984765060961472, "2": 1.1222578100840605e-06, "1": 0}, "score": 4.906055455945647}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6687089940234623, "4": 0.3296148260535145, "3": 0.001578006401262225, "2": 9.235064989759902e-07, "1": 0}, "score": 4.667194025238339}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6576300498764966, "5": 0.19326232810340757, "3": 0.13684499733379274, "2": 0.00941762825213719, "1": 0.0028172622469837256}, "score": 4.029131095451643}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6493386081801745, "5": 0.26018577080663124, "3": 0.0846680467980666, "2": 0.00447097577498177, "1": 0.001331937673001017}, "score": 4.162580717190463}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6393316149398972, "4": 0.32562931992441596, "3": 0.032598839154537505, "2": 0.001375579750500161, "1": 0.0010298626861965754}, "score": 4.600912930107387}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6257851109854172, "5": 0.19192033786599533, "3": 0.16515748594770968, "2": 0.014192886366542467, "1": 0.002922867862496204}, "score": 3.989608254139509}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5181551625365105, "5": 0.43321072783494735, "3": 0.04645118512751879, "2": 0.0016915026552232323, "1": 0.0004787977421188063}, "score": 4.381944965883476}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8478970702326029, "4": 0.1505594584584953, "3": 0.001526819294435809, "2": 4.116669892316668e-06, "1": 0}, "score": 4.8463726271709024}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6372556815716652, "4": 0.3587261481900443, "3": 0.003991690314780177, "2": 5.715893099776902e-06, "1": 0}, "score": 4.633265708619117}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7740515929931818, "4": 0.22445040709749844, "3": 0.0014840372996763787, "2": 4.049512720541685e-06, "1": 0}, "score": 4.772567115200757}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9593710590937772, "4": 0.040328784879312206, "3": 0.00028954610971702085, "2": 6.490111111323787e-07, "1": 0}, "score": 4.9590897683649455}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8356321037835498, "4": 0.1635575602731165, "3": 0.000713777477758408, "2": 1.1105257568047421e-06, "1": 0}, "score": 4.834995803883516}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4816393651787267, "4": 0.4520442525818672, "2": 0.03340788931019074, "5": 0.030778080944414445, "1": 0.0021241002033431503}, "score": 3.475947328829344}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.47676811422276016, "5": 0.29527640358839086, "3": 0.19832089070773187, "2": 0.023664105849632768, "1": 0.005963603896677326}, "score": 4.031736707894969}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7574902446737659, "3": 0.16371379960845445, "5": 0.0722953620905623, "2": 0.006060996824115558, "1": 0.00043680005832747105}, "score": 3.8951488754170596}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7811112841379003, "5": 0.1749082374518588, "3": 0.04373035480730044, "2": 0.00021403200458264865, "1": 3.0485755994831786e-05}, "score": 4.130659093821691}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.786657360164448, "3": 0.11492429175271782, "5": 0.09677041128201418, "2": 0.0014978335722886284, "1": 0.00014568788478571453}, "score": 3.9784132934176326}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5257754807753968, "3": 0.23726329621656708, "5": 0.2248447083896221, "2": 0.010543623598803184, "1": 0.0015106896659629742}, "score": 3.9619597298212605}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9384087474704408, "4": 0.060510825262059434, "3": 0.0010743880879302728, "2": 4.223239797246673e-06, "1": 1.1432962733036641e-06}, "score": 4.937323113498395}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8492842356063184, "4": 0.14862357676953275, "3": 0.002072211260669227, "2": 6.985604684480573e-06, "1": 0}, "score": 4.847209059024815}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8423221979810056, "4": 0.15384891954818106, "3": 0.0037841325474882487, "2": 2.1426480378959906e-05, "1": 0}, "score": 4.838514769524146}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8340571531621417, "4": 0.1586164428796285, "3": 0.007292885464188837, "2": 2.713603523217824e-05, "1": 3.6871933466015055e-06}, "score": 4.826701162226539}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8231026166419719, "4": 0.17507894368592175, "3": 0.0015598166448204831, "2": 3.1844371613113735e-06, "1": 0}, "score": 4.821746336848554}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8904065614002976, "4": 0.10880183270359557, "3": 0.0007630319144241328, "2": 9.201740500127917e-07, "1": 0}, "score": 4.889666291798264}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9267697556951778, "4": 0.07240603693402481, "3": 0.0007313630303092889, "2": 1.0908951066074262e-06, "1": 0}, "score": 4.926121185684283}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.957932828363834, "4": 0.041801581718995125, "3": 0.00024291645022016223, "2": 9.597960720479078e-07, "1": 0}, "score": 4.957708787694883}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9525213314585281, "4": 0.047238171264124114, "3": 0.00021849050494546828, "2": 4.77937913961906e-07, "1": 0}, "score": 4.952322387468814}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7312007961618477, "5": 0.2463242306724581, "3": 0.022332275836161295, "2": 0.00010050832480651592, "1": 0}, "score": 4.223800380101978}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7692722814796916, "4": 0.22606192789753266, "3": 0.004639633049642775, "2": 1.5736636957035527e-05, "1": 0}, "score": 4.7646091430992135}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9540051683412932, "4": 0.045664115881118676, "3": 0.00025358182650895097, "2": 3.4561652008053295e-07, "1": 0}, "score": 4.953824137848752}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9976042728459817, "4": 0.0023670131332182705, "3": 1.1236614049821866e-05, "1": 0, "2": 0}, "score": 4.997610471875927}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7211783121494294, "4": 0.27321722615425903, "3": 0.0055510587702697085, "2": 1.3543145578430974e-05, "1": 0}, "score": 4.715628691890554}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5225671221233055, "4": 0.4314668916101545, "3": 0.04503124035351211, "2": 0.0006144828120351883, "1": 0}, "score": 4.476459508545427}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6155807363413296, "4": 0.35577100481590856, "3": 0.02795056122433426, "2": 0.0005161110512693495, "1": 0.00015304615735651486}, "score": 4.58615554366181}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8577622378154788, "4": 0.13786230249141318, "3": 0.004165859758733768, "2": 1.3548875540812275e-05, "1": 0}, "score": 4.853736656281093}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9332423148928247, "4": 0.06481563654671216, "3": 0.0019249928991546968, "2": 1.1576330715243838e-05, "1": 0}, "score": 4.931299272228833}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9653616567684637, "4": 0.03432332591886214, "3": 0.0003080113269054077, "2": 1.1016946199717872e-06, "1": 0}, "score": 4.965057140030648}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7115909294281397, "5": 0.27053077942917925, "3": 0.017558431800040332, "2": 7.620404596711141e-05, "1": 0}, "score": 4.252881555467625}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8468968961634147, "4": 0.1517695996328135, "3": 0.0013088235482929887, "2": 3.3321377266003982e-06, "1": 0}, "score": 4.845599460634766}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4987035240411222, "5": 0.4970777134593011, "3": 0.0042005408003240935, "2": 9.123938445526055e-06, "1": 0}, "score": 4.492863408735489}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7393882676485023, "4": 0.25761042908320736, "3": 0.0029337406436966067, "2": 1.8939421774534724e-05, "1": 0}, "score": 4.736452456838432}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6005059674756411, "4": 0.3950341508382194, "3": 0.004434138200125755, "2": 1.2747441157893795e-05, "1": 0}, "score": 4.596054080738769}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8256184228543403, "4": 0.17225021860061027, "3": 0.00210090893858104, "2": 8.999855826807278e-06, "1": 0}, "score": 4.823517178442232}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8357465096494606, "4": 0.1630236820627879, "3": 0.0009989271548923948, "2": 2.4927201849876047e-06, "1": 0}, "score": 4.83493328614211}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9424438170441383, "4": 0.056954213834502436, "3": 0.0005151723773518379, "2": 1.0278580336810217e-06, "1": 0}, "score": 4.942007383874612}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9775586557896343, "4": 0.022299061201269833, "3": 0.00013584269446762675, "2": 5.930316895502754e-07, "1": 0}, "score": 4.97742734232601}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9559307555376427, "4": 0.043829836275594496, "3": 0.0001848497915968324, "2": 8.085834074877965e-07, "1": 0}, "score": 4.9557956624161665}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6045104633371009, "5": 0.3864110035318254, "3": 0.008991927936879335, "2": 2.7715326348610196e-05, "1": 0}, "score": 4.3773858691462095}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5238799101655551, "5": 0.46714265353688933, "3": 0.008878878721963036, "2": 4.129521187286586e-05, "1": 0}, "score": 4.458207422431263}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6685548342500218, "4": 0.31224994691015107, "3": 0.01879518234933546, "2": 0.00033898947441132396, "1": 4.92524719365823e-05}, "score": 4.648941569506043}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5150167781072762, "4": 0.4725861313922746, "3": 0.012282657142345693, "2": 6.866520256081475e-05, "1": 0}, "score": 4.5026197945407445}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7667310967691485, "5": 0.20182023571494978, "3": 0.03121061555151995, "2": 0.00020871497348511102, "1": 0}, "score": 4.170197183289677}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6921733838856619, "5": 0.2737910923706891, "3": 0.03377425341646576, "2": 0.00022203223143198303, "1": 2.1082758167284165e-05}, "score": 4.239513874672108}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.49325714925648095, "4": 0.4877932846013396, "3": 0.01889757069186134, "2": 3.5851182743943214e-05, "1": 0}, "score": 4.474295533353131}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6894363977644268, "4": 0.30377599735190836, "3": 0.006754304321960579, "2": 1.9848502390494237e-05, "1": 0}, "score": 4.682651579507223}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7917680470094894, "4": 0.2044488821055165, "3": 0.0037308674949295575, "2": 7.639373200277167e-06, "1": 0}, "score": 4.788057019754477}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.740040303557614, "4": 0.25752107952393544, "3": 0.0023937837641664138, "2": 7.60245755836313e-06, "1": 0}, "score": 4.737658778428598}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5375697069715883, "5": 0.4087836647162526, "3": 0.05225110186678768, "2": 0.0012785904739945103, "1": 0.00010687709805244102}, "score": 4.353658308011439}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5400863201873619, "5": 0.4238329191585471, "3": 0.03578367124859145, "2": 0.00027603082878184217, "1": 1.7413165498588223e-05}, "score": 4.387446359157201}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5809025640887614, "5": 0.36387750234654104, "3": 0.054399245211777386, "2": 0.0007682584945516268, "1": 4.782469117765741e-05}, "score": 4.307799683541131}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.645495138561213, "4": 0.3488740186598416, "3": 0.005599219869294471, "2": 2.539614924399608e-05, "1": 3.5975733832185732e-06}, "score": 4.639836015921832}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7414261409388849, "3": 0.1492195153250902, "5": 0.10545586023627912, "2": 0.0036583150734995394, "1": 0.0002123284902903527}, "score": 3.9482812894477295}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5745458134294121, "3": 0.2902075855011373, "5": 0.10992789809158765, "2": 0.02250107259542964, "1": 0.002787087876839635}, "score": 3.7663497675055395}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6463239049548777, "5": 0.2684593964818322, "3": 0.08364654127360628, "2": 0.0012795207310932347, "1": 0.00028869032042525}, "score": 4.181388095809198}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5517862698412045, "5": 0.393410808037356, "3": 0.05382190169243607, "2": 0.0008199169527245802, "1": 0}, "score": 4.338003525982501}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5553622363662823, "5": 0.3172831455963484, "3": 0.1237678308792342, "2": 0.003169816117098118, "1": 0.00036804807122414474}, "score": 4.186080641886872}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6934109181759809, "4": 0.3006069444401906, "3": 0.005953128495765964, "2": 1.611799835696266e-05, "1": 0}, "score": 4.687434415324729}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.48876007699623375, "4": 0.45205159384014, "3": 0.0557606642466219, "2": 0.0025040546522601013, "1": 0.0009164234669080148}, "score": 4.4252450891948545}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.587549289183725, "4": 0.36226872800538634, "3": 0.04920198552986988, "2": 0.0006921718465579194, "1": 0.00026088209395734325}, "score": 4.536194760556877}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.42656569119798515, "3": 0.33335983060913915, "5": 0.11435316279474009, "2": 0.08877579011459734, "1": 0.03694194694486158}, "score": 3.4926140955232152}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5258971330044533, "3": 0.2509679342508447, "5": 0.18935962388907426, "2": 0.02656133213357677, "1": 0.007204020543448642}, "score": 3.8636556062715948}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5190085613992463, "4": 0.22746575031285354, "3": 0.1360759762956167, "1": 0.0746616802792166, "2": 0.04278603990685948}, "score": 4.073375610602257}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8231026166419719, "4": 0.17507894368592175, "3": 0.0015598166448204831, "2": 3.1844371613113735e-06, "1": 0}, "score": 4.821746336848554}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9520139013871098, "4": 0.04772874223390997, "3": 0.0001905134046988219, "2": 2.899451702340436e-07, "1": 0}, "score": 4.951886158999321}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9384793090768935, "4": 0.06044130803110391, "3": 0.0009926563761302536, "2": 2.156301656103273e-06, "1": 0}, "score": 4.937561629885331}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9332830200773233, "4": 0.06652286206178008, "3": 0.00013081885211594673, "2": 3.281713357027289e-07, "1": 0}, "score": 4.933210309917264}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9745070495921397, "4": 0.02526008745178173, "3": 0.00011136583111573361, "2": 1.1772705323806188e-07, "1": 0}, "score": 4.974513734197229}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6055638933021567, "3": 0.3028424426406818, "5": 0.07185458895148135, "2": 0.01853049918055422, "1": 0.001183784226807799}, "score": 3.728393061671991}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6469365482509425, "3": 0.28635121416731335, "5": 0.052091171372722574, "2": 0.013883558231790731, "1": 0.0007343841508334538}, "score": 3.7357688628771264}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7929486369498787, "3": 0.12272852213998191, "5": 0.0817333058372794, "2": 0.0024470428094688253, "1": 0.00012292680020878298}, "score": 3.953741012599219}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6919883353065256, "5": 0.2686121664837975, "3": 0.039089378441781286, "2": 0.0002760095752262986, "1": 2.4813815085361338e-05}, "score": 4.228898455372778}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7415582229409046, "3": 0.16267951162611874, "5": 0.09167991070516357, "2": 0.0038148230424515954, "1": 0.00024144544765883412}, "score": 3.920644346560727}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6880613799394135, "4": 0.29152692802904334, "3": 0.020218444442020884, "2": 0.0001146390570261794, "1": 0}, "score": 4.667666141638932}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.752741374754092, "4": 0.24389228648210343, "3": 0.0033226520655894594, "2": 7.606948135263684e-06, "1": 0}, "score": 4.749430548059108}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6307266446814161, "5": 0.3296849755521406, "3": 0.039362940569411496, "2": 0.0001971160335161885, "1": 0}, "score": 4.289936014820854}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9502452754759131, "4": 0.04921856447136076, "3": 0.0004986618236883675, "2": 1.0413787517177952e-06, "1": 0}, "score": 4.949779156851249}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7105048324430933, "4": 0.2799678230765973, "3": 0.009499219895599974, "2": 1.6391904058358435e-05, "1": 0}, "score": 4.700981053126215}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7437588076306092, "5": 0.23684700377464304, "3": 0.01928161167869795, "2": 8.71077238570647e-05, "1": 0}, "score": 4.217396713566911}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7208886874171306, "5": 0.25626341466180513, "3": 0.0227268916831548, "2": 7.259235098626569e-05, "1": 0}, "score": 4.233402638205612}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7288487095446052, "5": 0.24119103093470282, "3": 0.029671060563592637, "2": 9.128655892366058e-05, "1": 0}, "score": 4.211379231823957}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8777920925744576, "5": 0.10019379684322322, "3": 0.02189317794608441, "2": 8.682985880513294e-05, "1": 0}, "score": 4.078129623616693}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5093772387014277, "5": 0.48064878610568823, "3": 0.009928925641309162, "2": 3.7439172823064526e-05, "1": 0}, "score": 4.470648563932563}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8317689591950714, "4": 0.16414467096242294, "3": 0.004061731168773145, "2": 1.35131536829841e-05, "1": 0}, "score": 4.82768941019406}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.83115878945828, "4": 0.16606729187931138, "3": 0.002760963129946385, "2": 6.9687338973550325e-06, "1": 0}, "score": 4.828388848257707}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9492644788974836, "4": 0.05026640086107605, "3": 0.00044137089687159946, "2": 1.5141436898829997e-06, "1": 0}, "score": 4.948844972851697}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9830211463612237, "4": 0.016656928882876555, "3": 0.00031838347674045375, "2": 1.5203241336764217e-06, "1": 1.0187501756236912e-06}, "score": 4.982697650850041}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9420474633059343, "4": 0.05745255512760837, "3": 0.00048684215717233176, "2": 7.963460574788988e-07, "1": 0}, "score": 4.941570650322717}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5878356129402188, "4": 0.3668939636717645, "2": 0.034812683159301284, "5": 0.00861513016503766, "1": 0.0018275902192138496}, "score": 3.3456615521868613}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7777707531390937, "3": 0.11372143199392466, "5": 0.10726507195485224, "2": 0.0011658922561470983, "1": 7.456655318644982e-05}, "score": 3.9909881352050487}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8153309700141097, "3": 0.11689054440036545, "5": 0.06635901878572484, "2": 0.0013423761353623192, "1": 7.268336621118201e-05}, "score": 3.946565436513944}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7213394125282516, "3": 0.17846776184214788, "5": 0.09577723047204373, "2": 0.004258492732378295, "1": 0.0001463472991102634}, "score": 3.9083524555869147}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7970385200937962, "5": 0.15478964698576372, "3": 0.047751719606608345, "2": 0.0003984848810908102, "1": 1.2980010990019173e-05}, "score": 4.106202936071785}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6611049348936445, "4": 0.3248056095700511, "3": 0.013917155377832068, "2": 0.00012293571272487292, "1": 0}, "score": 4.646973845595663}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9155115215187601, "4": 0.0827998192967256, "3": 0.001581220439579912, "2": 4.614993954397616e-06, "1": 0}, "score": 4.91401505354753}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9448189595853519, "4": 0.05467480384937738, "3": 0.0004450795623418239, "2": 1.5460766955596554e-06, "1": 0}, "score": 4.944427086042977}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9514993570202224, "4": 0.04761877322571548, "3": 0.0008330065938853585, "2": 2.5667141960567793e-06, "1": 0}, "score": 4.950705231271328}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8378031924171803, "4": 0.1603024557132807, "3": 0.0018104792314365269, "2": 4.143747443357752e-06, "1": 0}, "score": 4.836051083116248}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5277424702506103, "5": 0.4097507422046938, "3": 0.06142056899563984, "2": 0.0009149150852506242, "1": 0.00013180051875209608}, "score": 4.346118614186895}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6503199021553445, "5": 0.31415760256382996, "3": 0.034969070786248266, "2": 0.000466898018474714, "1": 8.464538241639846e-05}, "score": 4.278001322539916}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5251263703115847, "4": 0.46293649228274153, "3": 0.011820988985361606, "2": 0.00010046732577436614, "1": 1.2507050908565199e-05}, "score": 4.513068554023925}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.49774135716286777, "4": 0.48924385149002186, "3": 0.012835527075720707, "2": 0.00015111219255228514, "1": 2.2562845702366764e-05}, "score": 4.484538625364275}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6629347234355873, "5": 0.26779058585064713, "3": 0.06781353314808161, "2": 0.0012920476415976252, "1": 0.00016874598855839322}, "score": 4.196886791107793}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"5": 0.683855993051443, "4": 0.2656042924971766, "3": 0.04942698741552234, "2": 0.0008381051399652356, "1": 0.0002356452645652825}, "score": 4.6320704955409715}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5599481997375696, "5": 0.34897796371184714, "3": 0.08951117510388083, "2": 0.001335640535934588, "1": 0.00017438178425911594}, "score": 4.256285852846751}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7353514138116052, "5": 0.22455801196306635, "3": 0.039731148577355276, "2": 0.0002677197054363685, "1": 0}, "score": 4.184308326143604}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6360502241312858, "4": 0.33756543701886293, "3": 0.026041274992364256, "2": 0.00019446390315915537, "1": 0}, "score": 4.609710624303528}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6692991893948902, "4": 0.3109349974697828, "3": 0.019392226288415047, "2": 0.00014481043727237726, "1": 0}, "score": 4.6497659933629985}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7387679594242245, "2": 0.18488074192788892, "3": 0.04972752879148782, "5": 0.015781435470333137, "4": 0.010836979128405443}, "score": 1.3799745136388384}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9538671910125053, "2": 0.019279217051236905, "5": 0.018870296631215124, "3": 0.005549863200978027, "4": 0.0024313539396119384}, "score": 1.113154426950397}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.8954927209411514, "5": 0.06927513773498457, "2": 0.028272126189662024, "3": 0.0050155374239987255, "4": 0.001937804592617352}, "score": 1.3212193092896716}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.4440941009185799, "5": 0.43897884330297593, "2": 0.05396789209988015, "3": 0.04082251138898144, "4": 0.022125749786654526}, "score": 2.9579268837532933}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9291553326510336, "2": 0.052134383285207815, "5": 0.011104287322134459, "3": 0.005916280626989876, "4": 0.001686902115370566}, "score": 1.1134451194083197}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7125666552406686, "5": 0.25161201523249865, "3": 0.035282531354728856, "2": 0.0004803981109548715, "1": 5.757371104015547e-05}, "score": 4.215196144350096}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5280298039468004, "5": 0.4615001961556464, "3": 0.010413315033777588, "2": 4.6234420722293495e-05, "1": 5.253100942578192e-06}, "score": 4.450980996880123}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6368816904102949, "5": 0.3450153052125002, "3": 0.018018625609386305, "2": 6.603679310363724e-05, "1": 1.0556001470695758e-05}, "score": 4.326835482744819}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7190662813816276, "5": 0.2621499003734754, "3": 0.018653490355011557, "2": 0.00010693333019377334, "1": 1.3507790025728372e-05}, "score": 4.243244424889601}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7423374164695433, "5": 0.23296745809472114, "3": 0.024622968322444174, "2": 6.397366779325211e-05, "1": 7.17319783994997e-06}, "score": 4.208195233171918}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.49664726163876066, "4": 0.46845981721508234, "3": 0.03464364762080822, "2": 0.00017068547885525328, "1": 0}, "score": 4.461698527045552}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9477260208879443, "4": 0.05085617135185207, "3": 0.001403924991027195, "2": 9.664115164369012e-06, "1": 3.394805801211957e-06}, "score": 4.9462933628512795}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8522122103377666, "4": 0.14094186198237413, "3": 0.006766847214585592, "2": 3.796860211160246e-05, "1": 0}, "score": 4.845404182060007}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9799890351525102, "4": 0.01904078731302163, "3": 0.0009080028868661759, "1": 3.534696588494435e-05, "2": 2.2060629692691485e-05}, "score": 4.978935536745237}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8402703278905977, "4": 0.15513228103369184, "3": 0.004559864366895825, "2": 2.5002418444371738e-05, "1": 6.725589354226501e-06}, "score": 4.835645127575001}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5181030957403672, "5": 0.3924072795940833, "3": 0.0840207068834741, "2": 0.003952590864595191, "1": 0.00147561562999471}, "score": 4.296066597343795}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.562230483596967, "3": 0.3082320717574267, "5": 0.09946470712506196, "2": 0.025526725929472825, "1": 0.004540848455128749}, "score": 3.726555226310764}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5911182186635955, "5": 0.2903951492080603, "3": 0.11267452793842013, "2": 0.004483882403136719, "1": 0.0013078064642583335}, "score": 4.164832802185412}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.4708712626657984, "4": 0.4359917010950152, "3": 0.0869288248787416, "2": 0.004634946141447535, "1": 0.0015687706371740496}, "score": 4.369967896443622}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5421353963368082, "4": 0.4166237052790942, "3": 0.03955632790376377, "2": 0.0012848079847635906, "1": 0.000393633887579356}, "score": 4.498831607944159}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5552644234766029, "4": 0.4148866618612121, "3": 0.028453855760016054, "2": 0.0010843163312924055, "1": 0.00030665537436196317}, "score": 4.523724109494271}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5686589894902392, "5": 0.4108556880953143, "3": 0.020017081398766914, "2": 0.00037942340987799167, "1": 7.368870698657382e-05}, "score": 4.389864591977796}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7895668381777072, "4": 0.20181290977336, "3": 0.008341896419759064, "2": 0.00017247038799946292, "1": 0.0001002419293755841}, "score": 4.780583680270915}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5195229252318868, "4": 0.4622724699245765, "3": 0.017874681656271714, "2": 0.00028053726213169295, "1": 4.426408199331368e-05}, "score": 4.500956942628251}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5809090934702767, "5": 0.35875161865075644, "3": 0.056772274353914805, "2": 0.0029132353828365534, "1": 0.0006424882688248216}, "score": 4.29422873052981}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9259344270169214, "4": 0.07345669720911625, "3": 0.0005851917421947356, "2": 3.088679205560465e-06, "1": 0}, "score": 4.925362116075344}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9369222160596101, "4": 0.06263592397866657, "3": 0.00043162746124245083, "2": 3.2552352874021327e-06, "1": 0}, "score": 4.936490612271145}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9546823248269591, "4": 0.04487974049416446, "3": 0.00042654371466552087, "2": 2.997041267864473e-06, "1": 0}, "score": 4.954257796996173}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9415519005681289, "4": 0.0579639507769028, "3": 0.0004762425379464616, "2": 3.5919511761591774e-06, "1": 0}, "score": 4.941072534070815}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9504424138519995, "4": 0.049119037018876016, "3": 0.00042841620213334276, "2": 4.1427654915795576e-06, "1": 0}, "score": 4.950011402840613}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7839109886206083, "5": 0.189690895005722, "3": 0.025930232837705826, "2": 0.00036178950252640694, "1": 7.350273070401788e-05}, "score": 4.162821881548084}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6857001952132076, "4": 0.3075638410848976, "3": 0.006591894439028986, "2": 7.562686354496372e-05, "1": 0}, "score": 4.679003519677123}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5356473840383256, "5": 0.4527428113915474, "3": 0.011438093031225664, "2": 4.544348917852867e-05, "1": 0}, "score": 4.441269549627398}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6524884768116521, "5": 0.3316061531341704, "3": 0.01574255065317116, "2": 0.0001122179046074864, "1": 2.5096805270176033e-05}, "score": 4.315571924820445}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4952281566897924, "5": 0.49210774134022145, "3": 0.012495887360124226, "2": 0.00010510927864610559, "1": 0}, "score": 4.479431890131027}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6548375233971814, "3": 0.30198848242502707, "5": 0.03048588162743568, "2": 0.012483206724101662, "1": 0.0001985201404023337}, "score": 3.702933528359833}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.590451075171959, "3": 0.3947245733317882, "2": 0.007567867161821857, "5": 0.007151021967304185, "1": 7.742893577576119e-05}, "score": 3.5970471313529635}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8792018866709085, "3": 0.06831103901928551, "5": 0.0518854953964482, "2": 0.0005267237712842582, "1": 0}, "score": 3.9825197003442803}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8581773922414744, "3": 0.07216326193864032, "5": 0.06905278961605668, "2": 0.0005768360349714472, "1": 2.491822735505207e-05}, "score": 3.9956610800901684}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7599026241720628, "3": 0.15670414157620927, "5": 0.0805625884804511, "2": 0.0027084910697281524, "1": 9.092523341306897e-05}, "score": 3.918166133436418}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6221158621728112, "5": 0.2932552760397496, "3": 0.08336584382227584, "2": 0.0010867284696259257, "1": 0.00016158584637922203}, "score": 4.207234264839007}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8120696066654708, "4": 0.18441188825651939, "3": 0.0035019773950778635, "2": 4.0615901437809615e-06, "1": 0}, "score": 4.808569585793588}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.960862158292039, "4": 0.038854468091160624, "3": 0.00028035357039060926, "2": 2.9836507987866956e-07, "1": 0}, "score": 4.960583822394544}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9510830510675703, "4": 0.04856005498116334, "3": 0.00035158255831370936, "2": 4.159203755222555e-07, "1": 0}, "score": 4.95073529096705}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9371012921234365, "4": 0.06168934829551317, "3": 0.0012030948506525415, "2": 3.2199748789716156e-06, "1": 0}, "score": 4.935894606893294}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5562040642696292, "4": 0.4309849363298334, "3": 0.012658985496939447, "2": 9.436767210304402e-05, "1": 3.441868405152228e-05}, "score": 4.543265706106293}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8952339125947884, "4": 0.10253531532374588, "3": 0.0021905929902546954, "2": 1.34153095424441e-05, "1": 0}, "score": 4.893040390123471}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9171888542518429, "4": 0.08227049837682233, "3": 0.0005339141498498995, "2": 2.9445383805173146e-06, "1": 0}, "score": 4.916652523931162}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8356650784769516, "4": 0.16170469137298424, "3": 0.002602738809785203, "2": 1.3590697589902024e-05, "1": 0}, "score": 4.833046738157036}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9148019822214434, "4": 0.08409819287888783, "3": 0.0010823031090878184, "2": 9.522453707370567e-06, "1": 0}, "score": 4.913707943262583}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8268441863437709, "4": 0.16810217498727864, "3": 0.005004759096203692, "2": 1.1101303767632467e-05, "1": 0}, "score": 4.821848272645137}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9218600560239877, "4": 0.07704483144485622, "3": 0.0010554817301665308, "2": 2.9909679316164533e-06, "1": 0}, "score": 4.920832331500859}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8014913173434524, "4": 0.19495081168645056, "3": 0.0034752912170815213, "2": 7.340988877186786e-06, "1": 0}, "score": 4.798061389301254}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.953070441051721, "4": 0.04631180420279193, "3": 0.0005928222209212269, "2": 1.0694350923291107e-06, "1": 0}, "score": 4.952498209510612}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8646183355492625, "4": 0.13310029995197853, "3": 0.0022622402400706036, "2": 5.678877318279879e-06, "1": 0}, "score": 4.86235633226432}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6995493758637567, "5": 0.1962607395490691, "3": 0.10172129576117131, "2": 0.002275754803154945, "1": 0.00014223740929249362}, "score": 4.089565753677538}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5379866678905431, "5": 0.44876282060250344, "3": 0.013131670119672955, "2": 8.84911509690421e-05, "1": 0}, "score": 4.435467384718923}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6725584209352848, "5": 0.27628183305795084, "3": 0.05053394450949706, "2": 0.0005530922793108772, "1": 6.02569282803275e-05}, "score": 4.224463728292357}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7251477150384579, "4": 0.27134752488486186, "3": 0.0034791081387847227, "2": 9.068678541378343e-06, "1": 0}, "score": 4.72166243705795}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8494630287552322, "3": 0.09893865177186999, "5": 0.050281980832694806, "2": 0.0012424239613187192, "1": 7.061987058642863e-05}, "score": 3.9486464523263334}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"4": 0.656842549436465, "5": 0.26983408739242193, "3": 0.07276129698273155, "2": 0.00048038148946778574, "1": 6.466464182783378e-05}, "score": 4.19592136809814}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8157382724615284, "4": 0.17516981572451176, "3": 0.008996176727121954, "2": 8.361889890208781e-05, "1": 1.0035256655591844e-05}, "score": 4.806546430534333}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.499513377235444, "4": 0.49336064546276737, "3": 0.007102272327584825, "2": 1.253789374231076e-05, "1": 0}, "score": 4.492391527696182}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8962230027290906, "4": 0.10048288143214487, "3": 0.0032696739778720675, "2": 1.1147246959580143e-05, "1": 0}, "score": 4.892942905588493}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8980418483856578, "4": 0.09916399343360086, "3": 0.0027759792809504405, "2": 1.2112252674327857e-05, "1": 0}, "score": 4.8952470757474495}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6625753644044774, "3": 0.2618526599530115, "5": 0.05558366588132483, "2": 0.018369446699434057, "1": 0.0016173294138414442}, "score": 3.752139744157558}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7912069061567205, "3": 0.11086184417038329, "5": 0.09602677693507573, "2": 0.0017609197873401465, "1": 0.0001180555832398135}, "score": 3.9812884493450142}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7841508942465056, "5": 0.1587402913388701, "3": 0.05624738656745368, "2": 0.000787390141384299, "1": 6.833578432271015e-05}, "score": 4.100713691397239}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.656892858933904, "3": 0.28161902404560174, "5": 0.04321008335382514, "2": 0.01722874619168216, "1": 0.0010386966218731727}, "score": 3.724014554137921}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7604279363680881, "5": 0.1558226153172038, "3": 0.08209865870415696, "2": 0.0014591279736873, "1": 0.00017692139855178467}, "score": 4.070275972354597}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6933329831688074, "5": 0.27475551860105946, "3": 0.03147131761057881, "2": 0.00034699659178878076, "1": 8.935824884740794e-05}, "score": 4.242323060134816}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9594274583385838, "4": 0.04031162460043393, "3": 0.0002345042140211401, "2": 2.8837907201423716e-07, "1": 0}, "score": 4.959217436411535}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8698448209211921, "4": 0.12579723679759464, "3": 0.004305629183419676, "2": 3.8068172210663504e-05, "1": 1.3350616425356539e-05}, "score": 4.865423777500483}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7935192338920412, "4": 0.20303757876569734, "3": 0.003427094024769114, "2": 1.1467254718246258e-05, "1": 2.77597089468011e-06}, "score": 4.790062339133069}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7280292303586154, "4": 0.2632285007155468, "3": 0.008634674185003447, "2": 8.740928895504791e-05, "1": 1.807505042786433e-05}, "score": 4.719167030175563}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6541979941459669, "5": 0.2621749106669431, "3": 0.08113345398654502, "2": 0.0022426613851471346, "1": 0.00023732168891131116}, "score": 4.175846570578074}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6802876197623027, "4": 0.3097486242400314, "3": 0.009814719798054912, "2": 5.87134926377988e-05, "1": 0}, "score": 4.670416026769309}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9502744551055943, "4": 0.04888345418416881, "3": 0.000824909396569919, "2": 4.285458544876831e-06, "1": 0}, "score": 4.9494532188030895}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7938876630891805, "4": 0.20405918595220335, "3": 0.0020246861056386874, "2": 7.475825574776097e-06, "1": 0}, "score": 4.791864645801142}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8782571997791545, "4": 0.1197946083187662, "3": 0.0018895958665445364, "2": 9.496255452073894e-06, "1": 0}, "score": 4.8763916420385955}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6664012649147021, "5": 0.2909315391912233, "3": 0.042440860065345566, "2": 0.0002143935957034319, "1": 8.383098184857598e-06}, "score": 4.24803762543927}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9845691240760299, "4": 0.015224819819070716, "3": 0.00013854532909482624, "2": 2.1015489140225906e-07, "1": 0}, "score": 4.984496415657213}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6576906730085715, "5": 0.30256813112847897, "3": 0.03948458248910431, "2": 0.00015969912209051916, "1": 0}, "score": 4.262789618454434}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8850893399262614, "4": 0.11068433033604803, "3": 0.004214135539590699, "2": 9.093433484740283e-06, "1": 1.8545119430495487e-06}, "score": 4.880852551748719}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9463474387045497, "4": 0.05226164720313305, "3": 0.0013618284958479383, "2": 2.8809426740344245e-06, "1": 0}, "score": 4.945004611842041}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8361994565200747, "3": 0.08678955488352356, "5": 0.07566715473101658, "2": 0.0012314299793978246, "1": 0}, "score": 3.9864132126810046}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7862932378370209, "4": 0.20467913933167048, "3": 0.008595799717268584, "2": 0.000276045182758139, "1": 0.00011968551064144099}, "score": 4.776814328331809}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5464850432459436, "5": 0.4300633308899124, "3": 0.023068759024173, "2": 0.00031230227782308483, "1": 4.1899360235300316e-05}, "score": 4.4062559146372084}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8092471726276919, "4": 0.18852912023880675, "3": 0.002200681926624728, "2": 1.1086327119058524e-05, "1": 0}, "score": 4.807033953128156}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5830589399833976, "4": 0.4025257737548817, "3": 0.014231515104360543, "2": 0.000148451537468168, "1": 1.9992946932142278e-05}, "score": 4.568479255858945}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7319288274555308, "5": 0.1456135622843743, "3": 0.11973686925721481, "2": 0.0025716977373070188, "1": 0.00014415102835245024}, "score": 4.0203009437845205}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5414551724466063, "4": 0.44998622850872816, "3": 0.008510320291764507, "2": 4.08608976458262e-05, "1": 3.903972240368715e-06}, "score": 4.532853290826957}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6177916341164952, "5": 0.36046738424921854, "3": 0.02159570341609373, "2": 0.00012514305938428908, "1": 1.241274240102727e-05}, "score": 4.33858677119519}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7321801930102397, "5": 0.2386344728694275, "3": 0.02897704251267668, "2": 0.00019045683061929308, "1": 1.3926431175742886e-05}, "score": 4.209235555166902}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6559079172084001, "4": 0.339296745175841, "3": 0.004748896517640033, "2": 1.6908163590082905e-05, "1": 0}, "score": 4.651144434569534}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9943361928765422, "4": 0.005648803647782339, "3": 1.2448679561444148e-05, "1": 0, "2": 0}, "score": 4.994326284497909}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9973206967571189, "4": 0.0025698732509184265, "3": 1.3765845463587623e-05, "1": 0, "2": 0}, "score": 4.997402346555854}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9867017140168219, "4": 0.013127926814155392, "3": 0.00013207983600328692, "1": 0, "2": 0}, "score": 4.9866074008540755}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9944438140160471, "4": 0.005537124257993658, "3": 1.1263490411818638e-05, "1": 0, "2": 0}, "score": 4.994440305405375}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9910740697632194, "4": 0.008883887821995649, "3": 2.6187195186656678e-05, "1": 0, "2": 0}, "score": 4.991063596098984}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8394987176349621, "5": 0.12940205707719515, "3": 0.03097142728524585, "2": 0.00010283158551952736, "1": 0}, "score": 4.098227419007621}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8514497279698772, "5": 0.12130885073868214, "3": 0.027164690293020533, "2": 3.8158424458946794e-05, "1": 0}, "score": 4.094071472175562}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8564996755732462, "3": 0.13036062899018294, "5": 0.012577560065237333, "2": 0.0005553963249812192, "1": 5.900732867123036e-06}, "score": 3.8810883365412394}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9009526279031839, "5": 0.08550632749399462, "3": 0.013515812265822151, "2": 1.3717845246566736e-05, "1": 0}, "score": 4.071963908165506}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8981371356806732, "3": 0.05108728697025599, "5": 0.05027760649064899, "2": 0.00017266711635563985, "1": 0}, "score": 3.9988446094348076}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5052928079567471, "4": 0.48212618721197364, "3": 0.012415363268487816, "2": 4.661549786090965e-05, "1": 0}, "score": 4.492842874840559}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8930981444011779, "4": 0.10531333812606908, "3": 0.0014468633102950957, "2": 4.18957609413156e-06, "1": 0}, "score": 4.89176548811265}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7664589325439538, "4": 0.22793102904042184, "3": 0.005551361866353015, "2": 1.850014477934643e-05, "1": 0}, "score": 4.7609011406600485}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6202540914369374, "4": 0.37430069772270774, "3": 0.005363486762505675, "2": 1.2131854030327634e-05, "1": 0}, "score": 4.614909133860443}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8438039146435847, "4": 0.15403728430419636, "3": 0.0021108018077590474, "2": 5.5536343871029145e-06, "1": 0}, "score": 4.8417177327897285}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8906691952673207, "4": 0.10657671761180247, "3": 0.0026882888581110133, "2": 3.678689096607874e-05, "1": 0}, "score": 4.887933092784365}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8842581359302006, "4": 0.11199788408093615, "3": 0.003531421845645489, "2": 2.422716581635159e-05, "1": 0}, "score": 4.880844149992629}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5856687630426699, "4": 0.4045959597851122, "3": 0.009646906355035541, "2": 5.137450603934679e-05, "1": 0}, "score": 4.575940415346362}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9226094270443375, "4": 0.07584022911566861, "3": 0.0014553192305267347, "2": 8.834138207155434e-06, "1": 0}, "score": 4.921215839564741}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9185158023102434, "4": 0.08006177938671555, "3": 0.0013893920522455442, "2": 6.827124385851668e-06, "1": 0}, "score": 4.917136784191771}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7719888593154687, "4": 0.2226837668125487, "3": 0.005206026407032204, "2": 2.8250341837572184e-05, "1": 0}, "score": 4.766797718886399}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7976749462837378, "4": 0.19977488926906545, "3": 0.0025326383335914204, "2": 1.0887872530739475e-05, "1": 0}, "score": 4.7951258104419}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5561273857012469, "4": 0.42983210501277125, "3": 0.013902744670895738, "2": 0.00010813609340605147, "1": 2.016588989380449e-05}, "score": 4.541952999475536}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6620063572463997, "4": 0.3316545711669584, "3": 0.0062846445112213, "2": 4.04575209390018e-05, "1": 7.68215846624201e-06}, "score": 4.655621873372255}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.556060153964556, "4": 0.4238779368435127, "3": 0.01977616409613161, "2": 0.00019496412318388185, "1": 4.8117481795090504e-05}, "score": 4.53577256710467}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6049289656460086, "5": 0.28791355504379, "3": 0.10452308739182085, "2": 0.0024325796508507897, "1": 0.0001953765179177684}, "score": 4.177940323975886}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8417949093525148, "3": 0.11650614040806515, "5": 0.04035570929401844, "2": 0.001295214448814811, "1": 2.4432948211810427e-05}, "score": 3.9211839815941447}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5441663437036611, "5": 0.44608658902944526, "3": 0.009725516308875084, "2": 1.7182072744419167e-05, "1": 0}, "score": 4.436328614844741}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.752643329048472, "4": 0.24399076567484387, "3": 0.003347394489798302, "2": 1.2162063501207192e-05, "1": 0}, "score": 4.749276367380067}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6756868634548003, "5": 0.2954493680893952, "3": 0.028654605451403376, "2": 0.00018029070176399462, "1": 0}, "score": 4.266441874024886}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.42051164783014017, "5": 0.25030805491987057, "3": 0.2425411723814053, "2": 0.06459833774669181, "1": 0.02197504033319146}, "score": 3.812632767251647}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5945497574822419, "4": 0.35566034167085503, "3": 0.044046851709238596, "2": 0.003634073803685082, "1": 0.0020839888612394467}, "score": 4.536996209223058}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3269117245611206, "3": 0.28611155264398946, "5": 0.20455583683708203, "2": 0.11148224928423921, "1": 0.07092219839635566}, "score": 3.4827046869917915}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5163107841205644, "5": 0.44948129447838986, "3": 0.03316453158100112, "2": 0.0008582269353788455, "1": 0.00018326818245343555}, "score": 4.414051288983163}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.46026296030190705, "5": 0.447375183377237, "3": 0.08274534666183293, "2": 0.007815619872156754, "1": 0.0017485262302510299}, "score": 4.3437710193535715}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8767837291878278, "4": 0.11120550422104139, "3": 0.0108506586040911, "2": 0.0007039931021053808, "1": 0.00042157072542318465}, "score": 4.8632901938374165}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.521910511345523, "5": 0.43198470346964857, "3": 0.04551054143357842, "2": 0.0004267534977809741, "1": 0}, "score": 4.385685253561386}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5543184432848263, "5": 0.4046980562711661, "3": 0.040707146999357076, "2": 0.0001957588526206955, "1": 0}, "score": 4.363628698073139}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6124428543109798, "5": 0.3161280265927118, "3": 0.0704175188129856, "2": 0.0009058281045496243, "1": 9.42828736884219e-05}, "score": 4.243618801960301}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6435334126396396, "5": 0.2862511519048608, "3": 0.0684726420240644, "2": 0.0014555714592043689, "1": 0.0002049964286904107}, "score": 4.214269996143214}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9311235162401765, "4": 0.06813774233770047, "3": 0.0007277747259726577, "2": 3.5722318122831183e-06, "1": 0}, "score": 4.930395476826754}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9967153931623635, "4": 0.003264596850460191, "3": 1.4376422782568495e-05, "1": 0, "2": 0}, "score": 4.996706631750572}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9498011329858621, "4": 0.04970279052855143, "3": 0.00045580658232492424, "2": 1.6513606062619081e-06, "1": 0}, "score": 4.949378687303655}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9847525540815594, "4": 0.015209719723515713, "3": 2.7894779537391084e-05, "1": 0, "2": 0}, "score": 4.984734340634373}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9929855350117621, "4": 0.006994172336667831, "3": 1.9299893117927233e-05, "1": 0, "2": 0}, "score": 4.992967220895245}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7603037382125013, "3": 0.15019261629724, "5": 0.08228933224935525, "2": 0.007037327481435772, "1": 0.00017341361132752628}, "score": 3.917501525458489}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.48434179184325565, "4": 0.44044508787631953, "2": 0.05189669868425568, "5": 0.02023346018833, "1": 0.0030556345477166288}, "score": 3.4229155974286654}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5724288103610544, "4": 0.2899910263793096, "2": 0.12782949159581708, "5": 0.005978457424889433, "1": 0.003771975912880522}, "score": 3.1665745375065617}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7191863826700602, "5": 0.15872003736992596, "3": 0.11885678476681272, "2": 0.0031084617167420436, "1": 0.0001265817770206278}, "score": 4.033266642111725}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5201360328415685, "4": 0.36001020525615957, "2": 0.10432227219819687, "5": 0.010821217378679986, "1": 0.004709637678129164}, "score": 3.267911262488214}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7227296318084351, "5": 0.1727762282626493, "3": 0.10262027024687467, "2": 0.001648181862705387, "1": 0.0001936405408165132}, "score": 4.066280796787069}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9255926814047652, "4": 0.07176992948889166, "3": 0.0026038191705506156, "2": 1.554006547054288e-05, "1": 0}, "score": 4.922974423212435}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9437388113616634, "4": 0.05495670420632325, "3": 0.0012924159276537506, "2": 7.70017116600813e-06, "1": 2.6072487796641185e-06}, "score": 4.942424833035023}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9160670759218982, "4": 0.08125874766486718, "3": 0.002646884476157292, "2": 1.7799930591994306e-05, "1": 8.23035013860365e-06}, "score": 4.9133610528819105}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6408681868160788, "4": 0.33741117111775937, "3": 0.021401790333708575, "2": 0.0002560837547499933, "1": 5.570553746966688e-05}, "score": 4.618791482538324}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6003748312929368, "2": 0.1309893836375123, "3": 0.1212822384962998, "5": 0.08727471426133554, "4": 0.06007205023129956}, "score": 1.9028749917403327}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6221236137847463, "4": 0.2524763495000327, "3": 0.08273545918369545, "1": 0.02841201670190176, "2": 0.014232773225903909}, "score": 4.425694981527139}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8669387245142167, "4": 0.0867606587732167, "3": 0.028715268333334404, "1": 0.013829918863852651, "2": 0.0037255253631804036}, "score": 4.7893062523972665}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9032206439076049, "4": 0.07236291026592968, "3": 0.013939319377293936, "1": 0.008540329404244078, "2": 0.0019296570232846001}, "score": 4.859807161312751}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9730185833060953, "5": 0.02022905179766657, "2": 0.0038352544383049437, "3": 0.002317749284921349, "4": 0.0005986950428042606}, "score": 1.0911831060670483}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8595061318317335, "2": 0.07072960871807099, "5": 0.03826347856487777, "3": 0.02164797635073552, "4": 0.009847963464972418}, "score": 1.2966248020552853}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4926115236722494, "4": 0.41431285588652234, "3": 0.08570923496206936, "1": 0.0038607840282644467, "2": 0.00344756877243922}, "score": 4.388447341720186}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5207479164006481, "5": 0.3252013987885265, "3": 0.13670555495184294, "2": 0.009763083461691725, "1": 0.007506116931400216}, "score": 4.146462446934468}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.44739918122568983, "1": 0.43518689347062667, "4": 0.0626663912360106, "3": 0.035180567798268496, "2": 0.019555480487401418}, "score": 3.0675362619655173}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9130128217025147, "4": 0.07888151992873377, "3": 0.007731093225937304, "2": 0.0001626358346224305, "1": 0.00015653577184714242}, "score": 4.9045369549924835}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8728925343284493, "5": 0.09110393330155701, "3": 0.03588756580104601, "2": 9.768495525253145e-05, "1": 0}, "score": 4.055022003481018}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8901747920297374, "3": 0.08575790590869838, "5": 0.02388078782512601, "2": 0.00018132419432310076, "1": 2.508677088846493e-06}, "score": 3.9377525405883533}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8178373015686698, "3": 0.13722651834075, "5": 0.04409728778035006, "2": 0.0007973336774320654, "1": 2.97496556746785e-05}, "score": 3.9051857334582065}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8668582763334352, "3": 0.12386557177818745, "5": 0.008887862473883054, "2": 0.00038367911221351495, "1": 3.362573347134571e-06}, "score": 3.8842447003199907}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8480518849325451, "3": 0.13982216693293142, "5": 0.011846918350870084, "2": 0.0002697324543652159, "1": 0}, "score": 3.87148409165449}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7530093908587868, "4": 0.2261237416781786, "3": 0.0207293045727041, "2": 0.00012344819050452908, "1": 1.0492624250178609e-05}, "score": 4.73200436340745}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.697531182634424, "5": 0.2546706849522234, "3": 0.047493496172524616, "2": 0.00027581560868214267, "1": 2.7403220910521418e-05}, "score": 4.206543640656879}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5645091423730533, "5": 0.38699515709386373, "3": 0.04806208818862769, "2": 0.0003800149362861954, "1": 3.40188083341745e-05}, "score": 4.338077601693739}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5090989095465632, "5": 0.4746609116901996, "3": 0.01619374860173216, "2": 3.3663580577754545e-05, "1": 0}, "score": 4.458405688200627}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7257619866421573, "4": 0.2693211083362385, "3": 0.004901632333769994, "2": 7.054548301573425e-06, "1": 0}, "score": 4.720852169275495}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8135191600404276, "4": 0.16896945838604854, "3": 0.01619640459428828, "1": 0.0005672320946417263, "2": 0.000560723132062938}, "score": 4.794648229402597}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9919162159420751, "4": 0.007769697866336388, "3": 0.00026601815490208636, "2": 2.9599682974695545e-06, "1": 0}, "score": 4.991689011026307}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9156031376784273, "4": 0.07825771188321179, "3": 0.005765033582728141, "2": 0.0002222479294331356, "1": 0.00013437475262691807}, "score": 4.909006386294453}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9845305267692288, "4": 0.014811431466077973, "3": 0.0006323066979259597, "2": 6.606364866033304e-06, "1": 0}, "score": 4.983903828144599}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9505339620227262, "4": 0.048378228056906336, "3": 0.001065439914340718, "2": 7.123210651366248e-06, "1": 0}, "score": 4.94946875204286}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9837597413871838, "4": 0.01612283482071974, "3": 0.0001159402019737645, "2": 2.3794030834617731e-07, "1": 0}, "score": 4.983644550581245}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9401066497246318, "4": 0.05928723248226763, "3": 0.0005923111321943791, "2": 6.808080060421516e-07, "1": 0}, "score": 4.939525309047428}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.62809741821395, "4": 0.3678237484400951, "3": 0.004065038763953132, "2": 5.590778577972052e-06, "1": 0}, "score": 4.624026317282079}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5702244065098592, "4": 0.4169050837493622, "3": 0.01281793393491776, "2": 2.6516271355131763e-05, "1": 0}, "score": 4.557367964781942}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9876851343063899, "4": 0.012152108319627427, "3": 0.0001422307242913556, "2": 2.416839393842025e-07, "1": 0}, "score": 4.987562452884754}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6912174747883651, "4": 0.2939173128531869, "3": 0.014576676902776102, "2": 0.00011085067861490885, "1": 0}, "score": 4.67653930726434}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7534550783590016, "4": 0.24352545595840114, "3": 0.003010050268086015, "2": 4.154065768768651e-06, "1": 0}, "score": 4.7504406682894444}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8934938834618374, "4": 0.10578165159245378, "3": 0.0007072518726467213, "2": 2.0524199450709524e-06, "1": 0}, "score": 4.892796062120702}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9541038080347392, "4": 0.045574341829626004, "3": 0.00031067351133353744, "2": 4.3800128183952e-07, "1": 0}, "score": 4.953802501046336}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7987059368061229, "4": 0.19879011685589457, "3": 0.002397288432853427, "2": 3.1652674612955425e-06, "1": 0}, "score": 4.79638473779546}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9153803518479469, "4": 0.08372932537049797, "3": 0.0008826012895932449, "2": 3.954944459315109e-06, "1": 0}, "score": 4.914493285151836}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6878828580552566, "4": 0.3092239213388272, "3": 0.0028435002593767454, "2": 1.3714759078593196e-05, "1": 0}, "score": 4.6850365934227005}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8356265301360057, "4": 0.1630400667661527, "3": 0.0013148235563968705, "2": 5.14394378168015e-06, "1": 0}, "score": 4.834312628180843}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8597935815481352, "4": 0.13921683462448317, "3": 0.0009823705290033981, "2": 2.806394484779872e-06, "1": 0}, "score": 4.858809382920574}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8670291422685482, "4": 0.1309692390194697, "3": 0.0019613681765550434, "2": 1.3058360212507662e-05, "1": 0}, "score": 4.865065180375526}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7189616936071912, "5": 0.18420844671430467, "3": 0.09519713806301378, "2": 0.0014466814510070876, "1": 0.00016560601404097406}, "score": 4.0856228773379115}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5958282646496346, "5": 0.2383596288984055, "3": 0.16182328054577988, "2": 0.003637507807845844, "1": 0.00032943120890705575}, "score": 4.068274533427377}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7942750239016696, "5": 0.16932329556300763, "3": 0.03613182583314289, "2": 0.000193925789584182, "1": 0}, "score": 4.132813702550709}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7247784913379851, "3": 0.1453818281541851, "5": 0.12770623394816005, "2": 0.0019113994669721517, "1": 0.00019878633570149173}, "score": 3.9779047339003104}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8335596363839094, "5": 0.09465301950874504, "3": 0.070583138108438, "2": 0.0011139143784400145, "1": 8.484902985474689e-05}, "score": 4.021587623046457}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9869803357494135, "2": 0.012639700312482476, "3": 0.0003550368397249129, "4": 1.3016757397662273e-05, "5": 1.008782809489979e-05}, "score": 1.0134292000513951}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9979932017176865, "2": 0.0018579263105624549, "3": 0.00010998275249121184, "5": 3.1405579178169896e-05, "4": 7.075722496515466e-06}, "score": 1.0022247422072585}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9999323394050813, "2": 6.467026789640316e-05, "3": 2.1604954231463892e-06, "5": 5.462445869824439e-07, "4": 8.381079660405716e-08}, "score": 1.00007142768375}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9973876894371857, "2": 0.0025102799454647822, "3": 8.838604170966532e-05, "5": 8.478822278990531e-06, "4": 5.119662699944796e-06}, "score": 1.002736326432219}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9992541374538568, "2": 0.0007140572619720775, "3": 2.7338475199638003e-05, "5": 3.1947523016827445e-06, "4": 1.1245669834525798e-06}, "score": 1.000784887038291}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7195653714546072, "3": 0.19453098941563537, "5": 0.0809846863168538, "2": 0.004738466589210284, "1": 0.0001790477549992005}, "score": 3.8764394427198066}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6121082702155515, "5": 0.3228304229404174, "3": 0.06471020253698476, "2": 0.00032757517082176746, "1": 1.8747259054382667e-05}, "score": 4.257410059187911}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8126371248272332, "3": 0.11483864762103281, "5": 0.07179787496167504, "2": 0.0006951561926661973, "1": 2.33834044207369e-05}, "score": 3.9554984170514924}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7784085376239107, "5": 0.14074249990853333, "3": 0.08024773834387425, "2": 0.0005694788008009445, "1": 2.8739904506145625e-05}, "score": 4.059269762379972}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6066703294758967, "5": 0.3800010245808294, "3": 0.013236183835058436, "2": 4.9382077660160254e-05, "1": 0}, "score": 4.366681873256755}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8617345089637507, "4": 0.13545969998289834, "3": 0.002762815529050239, "2": 2.758705271042353e-05, "1": 0}, "score": 4.858929736945135}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8440226147649089, "4": 0.15234024588267042, "3": 0.0035259019609557678, "2": 1.0089896311644228e-05, "1": 0}, "score": 4.840561553707009}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5306058033517073, "5": 0.44161438933733144, "3": 0.027572433268674323, "2": 0.00013274480929004008, "1": 0}, "score": 4.4138073485751095}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5366031342847167, "4": 0.44875594112119493, "3": 0.014463033480300666, "2": 0.0001232558847168436, "1": 0}, "score": 4.521922104368712}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9200712925860848, "4": 0.07828014375777159, "3": 0.0016260449885570638, "2": 1.2309626000404486e-05, "1": 0}, "score": 4.918430004635638}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7239951395121238, "5": 0.20822959207002825, "3": 0.0672588547515354, "2": 0.0004809778205713191, "1": 2.4787526376847893e-05}, "score": 4.139935909180472}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7534106860935936, "4": 0.23645161020450572, "3": 0.010074316647505877, "2": 4.8439207493176336e-05, "1": 0}, "score": 4.743250601027295}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7860418607652735, "5": 0.1759841050919349, "3": 0.03773957501382788, "2": 0.00020844256964816355, "1": 0}, "score": 4.137831230833203}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.624471928991516, "4": 0.36696529479146256, "3": 0.008523894002551966, "2": 3.040027206760122e-05, "1": 0}, "score": 4.615892458409188}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9440775082595652, "5": 0.04154051761381432, "3": 0.014322078232669073, "2": 5.870427534303125e-05, "1": 9.586382970467189e-07}, "score": 4.027098161228906}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3240630770126847, "4": 0.2393761056869835, "2": 0.23718641164208162, "1": 0.16479699432372458, "5": 0.03455729526904371}, "score": 2.7417051000584194}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4833129526769259, "5": 0.3052894915232263, "3": 0.17255091959699886, "2": 0.023299019519594465, "1": 0.01551794783649174}, "score": 4.039587863903831}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5883413925449418, "5": 0.36736792965807985, "3": 0.04349322935557612, "2": 0.0005383121293261509, "1": 0.00021285295133260143}, "score": 4.322174428505151}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5482266404884878, "5": 0.24786129094385487, "3": 0.17880109358754326, "2": 0.02062576822876065, "1": 0.004473082547880758}, "score": 4.014389587717438}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6066467729243565, "4": 0.325405298920913, "3": 0.062111085220923255, "2": 0.004296745943902043, "1": 0.0015036060839902735}, "score": 4.53145077068373}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6158219496533905, "4": 0.3057973962730629, "3": 0.07327192195667523, "2": 0.003586234904317396, "1": 0.0015128439332878984}, "score": 4.530844150475048}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8643371036600009, "4": 0.1271363940395657, "3": 0.008422260658553074, "2": 7.711012215154405e-05, "1": 2.3849089916387912e-05}, "score": 4.855691884235946}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6906482843143806, "5": 0.23644418574050996, "3": 0.07089653629659305, "2": 0.0017696673286083282, "1": 0.00023855969152967774}, "score": 4.161293081950129}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6084564126096229, "4": 0.35016769873723225, "3": 0.039057451556161964, "2": 0.0015229668066819822, "1": 0.0007875531480141695}, "score": 4.563994833223399}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.906554417728924, "4": 0.0913556087112193, "3": 0.002068285036232482, "2": 1.3980766420805215e-05, "1": 6.841579034330268e-06}, "score": 4.904438429827571}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4088989702322556, "4": 0.40340659704052323, "2": 0.0949906132650232, "5": 0.06503547426728376, "1": 0.02763946876659009}, "score": 3.383219060774629}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7296276817111043, "5": 0.18326393453273948, "3": 0.08507135534555552, "2": 0.0018659909994770407, "1": 0.00016687008206759776}, "score": 4.093960378505843}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7223525954130862, "5": 0.22277276902722515, "3": 0.05403774473576416, "2": 0.000732714080283444, "1": 8.238262540645755e-05}, "score": 4.167026088440994}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6585597337946303, "5": 0.3194807683289024, "3": 0.021760023000210196, "2": 0.00015861336241677093, "1": 0}, "score": 4.297415671458434}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6312002584451912, "5": 0.3179909359214043, "3": 0.04913746502561841, "2": 0.001382708530690342, "1": 0.00026277510649086656}, "score": 4.265306588539593}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5243459828136369, "5": 0.4489025511931486, "3": 0.02653668403624115, "2": 0.00019545878874860676, "1": 1.8000482407690214e-05}, "score": 4.421921506201779}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7193643889416309, "4": 0.2742121231583374, "3": 0.006386569558825033, "2": 1.7480807380286138e-05, "1": 0}, "score": 4.712956715888327}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.49276857847850075, "5": 0.46742570624736235, "3": 0.03950121294808786, "2": 0.00025610629111199663, "1": 3.742932761531361e-05}, "score": 4.427304678859556}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.708119616287621, "4": 0.2760403026034222, "3": 0.015683178094490727, "2": 0.00013123853666527718, "1": 2.1907248372259505e-05}, "score": 4.692110839793897}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6316170702316447, "4": 0.346238892990803, "3": 0.021904497455039796, "2": 0.00019999483834985506, "1": 2.6470570215609443e-05}, "score": 4.609241136555451}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"4": 0.538596369096697, "3": 0.31735603390579376, "5": 0.12943929140491747, "2": 0.013725618895978692, "1": 0.0008703353158968345}, "score": 3.7820183213847733}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5304668028410912, "5": 0.41632369846092504, "3": 0.052432041265346604, "2": 0.0006747724736423935, "1": 8.062530499272404e-05}, "score": 4.362308228727483}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7490886385076593, "5": 0.19183516333390263, "3": 0.05779040040821225, "2": 0.0011627326633640402, "1": 0.0001147757882577789}, "score": 4.131376059249574}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6791492072379295, "4": 0.3147692337192973, "3": 0.006052605732966374, "2": 1.9441881084642104e-05, "1": 0}, "score": 4.673064119544192}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5488716244841573, "3": 0.27450425973298676, "5": 0.15696847342630074, "2": 0.018071983731889937, "1": 0.0015716573177371902}, "score": 3.8416033733097894}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.584815755043857, "3": 0.27523654153420485, "5": 0.07622893225249239, "2": 0.05466988880544586, "1": 0.009044500369219869}, "score": 3.664517641917794}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4701597069388986, "3": 0.30046004367122103, "5": 0.15459810505294821, "2": 0.061837852624916034, "1": 0.012936722582546389}, "score": 3.6916498544420824}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.37430905595060715, "4": 0.2869467558843856, "2": 0.1849743892451007, "5": 0.09092779035913369, "1": 0.0628400920980395}, "score": 3.158148066246349}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5833847860297835, "3": 0.26507920787908384, "5": 0.08726092594578787, "2": 0.04784641909182718, "1": 0.016425134925547452}, "score": 3.6772123369158005}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.34831936657922774, "3": 0.31162934319102437, "2": 0.22117226532354248, "1": 0.06589041471668187, "5": 0.05298787315536437}, "score": 3.101342092825634}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7558851744398298, "5": 0.12533902663660354, "3": 0.11748219368360466, "2": 0.001207104695938592, "1": 8.150020682423524e-05}, "score": 4.005198148933147}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.64619769022151, "3": 0.28799161898965214, "5": 0.06027336385220253, "2": 0.005328525610448483, "1": 0.0001728965706100631}, "score": 3.7610974261913035}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7834891699001306, "3": 0.11261513032139621, "5": 0.10273064635391817, "2": 0.0010735718631881357, "1": 7.161593162643372e-05}, "score": 3.987753281222486}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6037801725656862, "5": 0.3474288094003368, "3": 0.048385698232001, "2": 0.0003670665467694733, "1": 3.08298247648194e-05}, "score": 4.298218702406296}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7407328092649361, "3": 0.19475093367877977, "5": 0.06264226931915168, "2": 0.0017509802587742018, "1": 0.0001051988699119718}, "score": 3.864071357813122}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5686391663833843, "4": 0.39716647646814307, "3": 0.033401916513566006, "2": 0.0007101642334213999, "1": 7.936909477931858e-05}, "score": 4.533580365400412}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.670667576380084, "4": 0.31908473005758153, "3": 0.010185297704805635, "2": 5.0802245581326534e-05, "1": 7.829099977269741e-06}, "score": 4.660359672816077}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7337883818813038, "3": 0.21456366030654914, "5": 0.04812042287443478, "2": 0.0033681151289714204, "1": 0.0001518312274093364}, "score": 3.826363720974689}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6178749921869792, "5": 0.3357803342268095, "3": 0.04596298409590437, "2": 0.00032564751626775905, "1": 0}, "score": 4.289182261443158}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5377049711490091, "5": 0.44257408713282104, "3": 0.01965056083210715, "2": 6.51124358572497e-05, "1": 4.4928019883114265e-06}, "score": 4.422780150951705}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9952750409062419, "4": 0.0046832826218680245, "3": 3.457125505312435e-05, "1": 0, "2": 0}, "score": 4.995247541100775}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9956555356078093, "4": 0.004260098486804094, "3": 7.39809448460398e-05, "1": 0, "2": 0}, "score": 4.9955918938454955}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9976084237862365, "4": 0.002370365775712409, "3": 1.4114611790031898e-05, "1": 0, "2": 0}, "score": 4.997601387980573}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9936491663357935, "4": 0.006227184341181297, "3": 0.00011566921907478715, "1": 0, "2": 0}, "score": 4.993541425680574}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976284739218209, "4": 0.002350873071582804, "3": 1.2029904096953836e-05, "1": 0, "2": 0}, "score": 4.997625046640756}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7302594916425426, "3": 0.13438080245124, "5": 0.13328214590039228, "2": 0.0019566596888344824, "1": 0.00010035677211964342}, "score": 3.9946868446040784}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.49959535410666667, "3": 0.34355519365811815, "5": 0.13770078120840057, "2": 0.015998776954625076, "1": 0.0031383393135622794}, "score": 3.7527301585570116}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4630061231672921, "3": 0.44522617389071717, "5": 0.0771317716221105, "2": 0.013204103849752073, "1": 0.0014120096579874845}, "score": 3.6012534587738814}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5700375745859285, "5": 0.28750129914204564, "3": 0.1406932486530378, "2": 0.0015593871304633406, "1": 0.00013591674891411535}, "score": 4.143291925212208}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4777915927483733, "3": 0.3633473918538082, "5": 0.1335304416226652, "2": 0.02173041471478819, "1": 0.003584480588807004}, "score": 3.7159643253276124}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5113537286397886, "4": 0.29054482838997636, "2": 0.16059920944354358, "1": 0.019241374434335566, "5": 0.0182593135065725}, "score": 3.1279816948975947}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.41639310540636665, "2": 0.3619314679984886, "4": 0.16138176656580838, "1": 0.05083316414008958, "5": 0.009458378656344026}, "score": 2.7167001277880183}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4248305650578628, "3": 0.4136538359373362, "5": 0.0860597032287708, "2": 0.06579650878744851, "1": 0.009643447594609432}, "score": 3.5118747265116674}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6437162342695126, "3": 0.2310447186422591, "5": 0.10771415215183121, "2": 0.015958143751844192, "1": 0.001564351371511523}, "score": 3.84005970806455}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5448091931127581, "3": 0.31523323045026264, "5": 0.1002680278535155, "2": 0.035447877530382824, "1": 0.00420581999420905}, "score": 3.7015108812088897}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7152076921052146, "3": 0.22014899761098145, "5": 0.05166480932115365, "2": 0.012030628571837447, "1": 0.0009438115886817682}, "score": 3.804622326410379}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5383759667112509, "5": 0.44104196029515713, "3": 0.02028934312481333, "2": 0.00026190217546844934, "1": 2.0844957197577855e-05}, "score": 4.4201704723987625}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8763964692200998, "4": 0.12277353494164339, "3": 0.0008197652821182897, "2": 2.8335109411187683e-06, "1": 0}, "score": 4.875577513602541}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5460283617441227, "4": 0.43753270136529154, "3": 0.01629081218048372, "2": 0.00013592191384870724, "1": 8.766003997013384e-06}, "score": 4.529441227303461}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.754139941039328, "5": 0.13167875458347827, "3": 0.11194204466086165, "2": 0.002164018433025966, "1": 7.279407452220904e-05}, "score": 4.015190328006902}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"4": 0.724471018566577, "5": 0.21854701848973082, "3": 0.05538966250627551, "2": 0.0013587936431107262, "1": 0.0002304764200252939}, "score": 4.1597488235358835}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9703641039689994, "4": 0.02918610322337645, "3": 0.0004296989546199463, "2": 3.393346348522253e-06, "1": 0}, "score": 4.969943816874852}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6988728402247268, "4": 0.2927885801135573, "3": 0.008205250703010905, "2": 9.504073203415738e-05, "1": 2.8244212178485518e-05}, "score": 4.690399709805802}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9573774650067327, "4": 0.04201803702126521, "3": 0.0005902205956571429, "2": 3.6424391666676526e-06, "1": 0}, "score": 4.95679013493572}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8856541273897268, "4": 0.11236915510014996, "3": 0.0019373678606837126, "2": 2.3688117662496365e-05, "1": 8.56635702779338e-06}, "score": 4.883649953873475}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9792502276131717, "4": 0.020481295991049756, "3": 0.0002556950588158285, "2": 4.272818376988686e-07, "1": 0}, "score": 4.979005772681964}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.992765659236613, "4": 0.007211538256681399, "3": 2.0352211067749647e-05, "2": 7.280297625178331e-08, "1": 0}, "score": 4.992747521669541}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9844216958886606, "4": 0.015393462079461592, "3": 0.00012151765464735252, "2": 3.202057753021743e-07, "1": 0}, "score": 4.984361556706754}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977516433487772, "4": 0.0022299718877047438, "3": 1.071388493767384e-05, "1": 0, "2": 0}, "score": 4.997748583072075}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.976161143648831, "4": 0.023622956658225145, "3": 0.00017018593216003416, "2": 1.8021018010488903e-07, "1": 0}, "score": 4.976035039637179}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6657762805259987, "5": 0.2577658407926778, "3": 0.07595977159151383, "2": 0.0004212740440765741, "1": 5.3884968311074906e-05}, "score": 4.180806015358516}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7617479517456095, "4": 0.23554321009495421, "3": 0.002699483015625295, "2": 5.180795199799823e-06, "1": 0}, "score": 4.7590412756424785}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7220987691996522, "4": 0.2591414311775428, "3": 0.0186296794618453, "2": 8.95911513602736e-05, "1": 0}, "score": 4.703318412233767}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.663050090744054, "4": 0.3242474889481986, "3": 0.012662973705480847, "2": 2.8372136600853278e-05, "1": 5.77526162241421e-06}, "score": 4.650316493140294}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5228473402361576, "5": 0.4622991207006689, "3": 0.014785829841432232, "2": 5.474981873770467e-05, "1": 0}, "score": 4.4474095893829375}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6665431235207057, "5": 0.31892398376553516, "3": 0.014448249696936534, "2": 6.640335338307188e-05, "1": 0}, "score": 4.30434847857565}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7307502740245652, "4": 0.2665671225793326, "3": 0.002670187191103429, "2": 4.760942048279461e-06, "1": 0}, "score": 4.728076138563654}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7399016773926638, "4": 0.2590442195506066, "3": 0.0010160765379858211, "2": 1.333983472470488e-06, "1": 0}, "score": 4.738910045370635}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8902179576519449, "4": 0.10915747659294736, "3": 0.000617237303136978, "2": 9.595571125776565e-07, "1": 0}, "score": 4.8896044670319}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.675957097628339, "4": 0.3187032691007708, "3": 0.005310804227093254, "2": 1.25282056953605e-05, "1": 0}, "score": 4.670632168856265}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8104350068330994, "3": 0.14023902370428903, "5": 0.0483703769076307, "2": 0.0009161793642123531, "1": 3.0032362732294027e-05}, "score": 3.9062080175402616}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.860695444608153, "3": 0.09896868420987467, "5": 0.03973318683755822, "2": 0.0005713046231119082, "1": 0}, "score": 3.9396199986738454}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6891893687091051, "5": 0.1557584919262384, "3": 0.15428249096977384, "2": 0.0007300748462266361, "1": 2.676134666944939e-05}, "score": 3.9999355663984666}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7488311161459764, "5": 0.21672103618528915, "3": 0.034357023929811284, "2": 6.828168380815821e-05, "1": 0}, "score": 4.182231556761658}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7347000340576845, "3": 0.21071922897422624, "5": 0.05351690466195217, "2": 0.000942818278148664, "1": 0}, "score": 3.8408927849264507}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7727863726297353, "4": 0.21433158511190292, "3": 0.01268545775829263, "2": 0.00016724679869101864, "1": 2.2117066669091856e-05}, "score": 4.759705555630356}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.794771561217194, "4": 0.1913675795790602, "3": 0.013429399268679008, "2": 0.00028196404363387754, "1": 0}, "score": 4.780894974451568}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8452128667805838, "4": 0.14879789547445468, "3": 0.005845752206717096, "2": 4.6524197703575655e-05, "1": 0}, "score": 4.839355451208199}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.962830134256466, "4": 0.03632944534500617, "3": 0.0008023788340235648, "2": 2.741259696405885e-06, "1": 0}, "score": 4.962056233781344}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9615947354478793, "4": 0.037877288293027965, "3": 0.00043977615462167713, "2": 1.2362610694437883e-06, "1": 0}, "score": 4.961236079555013}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"4": 0.550591105830098, "3": 0.39496651098171964, "5": 0.04213771062153165, "2": 0.011748140573247448, "1": 0.0005443625940297319}, "score": 3.6220372311313453}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7228160031600216, "3": 0.13992610739947667, "5": 0.1348189111383308, "2": 0.0022806159933132395, "1": 0.000149230420533851}, "score": 3.9898837881105096}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7501818238752219, "3": 0.2100038951717046, "5": 0.03833321217285968, "2": 0.00145096170147665, "1": 2.899831016059185e-05}, "score": 3.825340205010428}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6707737581686986, "4": 0.3221663022969723, "3": 0.007030767529207761, "2": 1.4338633789934133e-05, "1": 0}, "score": 4.663724158638818}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7320241747144273, "3": 0.19896421391535524, "5": 0.06648520082977885, "2": 0.002446029943423443, "1": 7.555558102763012e-05}, "score": 3.8624015963699962}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8123467239667067, "4": 0.18250585943168615, "3": 0.005090944019987103, "2": 3.3578922311347226e-05, "1": 1.8610474324885846e-05}, "score": 4.807136247792978}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5206235037576737, "5": 0.4054295121526569, "3": 0.07039693878015489, "2": 0.0029155881873428728, "1": 0.0006310803916326055}, "score": 4.3273092610580965}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8638440190354538, "4": 0.13286345928698037, "3": 0.003267216107315864, "2": 1.337727749069517e-05, "1": 5.76040945410979e-06}, "score": 4.86053807484322}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6473175054493769, "4": 0.3396852586360207, "3": 0.012848065804768815, "2": 0.00010904041114438185, "1": 2.295827775493299e-05}, "score": 4.634193373990433}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7834309274801378, "4": 0.20900765518681363, "3": 0.007397079639314991, "2": 0.00010837501331534, "1": 4.943924578939844e-05}, "score": 4.775673840134413}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6571854187464217, "5": 0.2138098735956184, "3": 0.12790374373860988, "2": 0.0010260733946966436, "1": 7.195072847088081e-05}, "score": 4.083638376761983}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6082716524543631, "5": 0.34906392757032395, "3": 0.04231089335335553, "2": 0.00029406256710053455, "1": 4.485739949058538e-05}, "score": 4.306034807029254}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.686754617727163, "5": 0.21751366561790447, "3": 0.09516543317706688, "2": 0.0005216190634470721, "1": 4.0586948847219065e-05}, "score": 4.121183727589879}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6138794534476814, "5": 0.3486057330865638, "3": 0.03725126779390621, "2": 0.00020484683590547657, "1": 3.0083401003442887e-05}, "score": 4.310863416909719}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5016577824630819, "4": 0.45635706436146317, "3": 0.04177331668943104, "2": 0.00017280807022394313, "1": 3.6041013647332365e-05}, "score": 4.459432099100703}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5363311990837473, "3": 0.40073081154450857, "5": 0.042246384618505835, "2": 0.01954398524480735, "1": 0.0011467768623450755}, "score": 3.5989869340852563}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7900634976333752, "3": 0.13060070029733628, "5": 0.07782327718015315, "2": 0.0014323569138268333, "1": 7.092709779885272e-05}, "score": 3.9441445656085388}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6774784736116495, "3": 0.18733764537602135, "5": 0.13212311522280143, "2": 0.0029209177912959167, "1": 0.0001333065759551192}, "score": 3.938543312522178}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6927939461557041, "5": 0.25215401689733385, "3": 0.05470818206649359, "2": 0.00024891527013262774, "1": 0}, "score": 4.196966704232723}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.48610392037863526, "5": 0.44320750944456283, "3": 0.06967870023191484, "2": 0.0008981791595861915, "1": 8.938470280405925e-05}, "score": 4.3714725828831416}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6235847044011419, "5": 0.3422310449448668, "3": 0.033887142968513126, "2": 0.00010048661735284712, "1": 0}, "score": 4.308203528048532}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4938092154166775, "5": 0.4719731880447418, "3": 0.03396849505396082, "2": 0.00011476040933256344, "1": 0}, "score": 4.4378339912613}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7294577712108795, "4": 0.26241829566755914, "3": 0.008073458709341105, "2": 2.0377769126967256e-05, "1": 0}, "score": 4.721365267636283}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8830945287774162, "4": 0.11526727693624395, "3": 0.0016141150970465767, "2": 2.7040173050701113e-06, "1": 0}, "score": 4.881493847728361}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.784604170322248, "4": 0.20999329024277513, "3": 0.005347957856548623, "2": 1.167420325991604e-05, "1": 0}, "score": 4.779266300330685}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5188908272825963, "5": 0.47175311107577633, "3": 0.009316409232547864, "2": 3.11998896504389e-05, "1": 0}, "score": 4.462378210324735}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5713909086329001, "5": 0.39336004164835053, "3": 0.034776712403938266, "2": 0.0004222014450031056, "1": 3.7241232871290744e-05}, "score": 4.357631814188192}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7224422015862811, "5": 0.22275706410061388, "3": 0.054433424110454355, "2": 0.0003333485228961557, "1": 2.1149379308890456e-05}, "score": 4.16759564209216}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5424159697689606, "4": 0.450423724164154, "3": 0.007131141209003505, "2": 2.2591812411573393e-05, "1": 0}, "score": 4.535243163112782}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.584329548460244, "5": 0.37957979148665255, "3": 0.03594377021844449, "2": 0.00011261952003010193, "1": 0}, "score": 4.343422551427036}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9271185091514468, "4": 0.07077939158232291, "3": 0.0020835994001175565, "2": 1.1814783165139391e-05, "1": 3.6937254580382424e-06}, "score": 4.9250029660231744}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5916300825276871, "4": 0.3936102903357833, "3": 0.014629123161867395, "2": 0.00010134895458685759, "1": 0}, "score": 4.5768150785118396}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.902178179661749, "4": 0.0962629951868141, "3": 0.0015226707707103923, "2": 4.586469509034218e-06, "1": 0}, "score": 4.900674768373144}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.964588279551578, "4": 0.035124408195389555, "3": 0.0002858366683395848, "2": 1.0156375648095985e-06, "1": 1.9636375596219958e-07}, "score": 4.964300076690307}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9230661856072538, "4": 0.07537263506618597, "3": 0.0015458544182058503, "2": 8.866849595376923e-06, "1": 0}, "score": 4.921508548646211}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7316668291998315, "3": 0.2008064038479568, "5": 0.059744687754352634, "2": 0.007203530686707008, "1": 0.0005597244214006519}, "score": 3.8428490910459656}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.85871151636371, "3": 0.10986475166505, "5": 0.030508690546636984, "2": 0.0008734232475210384, "1": 0}, "score": 3.9188937168908926}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8072400542115136, "5": 0.13337390224293694, "3": 0.0588212555766675, "2": 0.0004852159055506504, "1": 0}, "score": 4.073588070409768}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7933588560584264, "5": 0.15667639173005754, "3": 0.04903763570884386, "2": 0.0008788086276207665, "1": 4.1290215454518646e-05}, "score": 4.105758010293324}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7973109386114067, "3": 0.16183284458427472, "5": 0.03837347167217902, "2": 0.002360893806683015, "1": 8.578005823396361e-05}, "score": 3.871556866193234}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6650370337681428, "5": 0.22091050814396154, "3": 0.11244505237370969, "2": 0.0014837945310331687, "1": 7.870790207665781e-05}, "score": 4.105266469811837}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4641795548270794, "4": 0.4035401063713845, "2": 0.1021812787988239, "5": 0.02300029355209201, "1": 0.007076590889666312}, "score": 3.3332136220963995}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6508135521642273, "4": 0.329310896585501, "3": 0.019659840052063518, "2": 0.0001718653906589123, "1": 0}, "score": 4.630837640916645}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6567516421505813, "5": 0.24981358481578336, "3": 0.09221067262194373, "2": 0.0011020848222773277, "1": 7.264158528877694e-05}, "score": 4.155188480070073}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6021420488277281, "3": 0.346982199021849, "5": 0.03333967332492781, "2": 0.016949753297184105, "1": 0.0005785260396407539}, "score": 3.6507196653817764}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4116696959632753, "1": 0.37257002956495305, "3": 0.17628998460714854, "4": 0.027679436668812667, "5": 0.011767874032271749}, "score": 1.8943800234179213}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.34783766080101136, "3": 0.25223156618012094, "1": 0.20607440213254224, "4": 0.10747510925911816, "5": 0.08636823683403733}, "score": 2.5202188688110962}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3688700370854948, "4": 0.327689554164484, "5": 0.1438571335523032, "2": 0.12675844645916767, "1": 0.0327945741346491}, "score": 3.4230690263264387}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7640418147233766, "4": 0.16323335111629603, "3": 0.055322299821110234, "1": 0.009177926236797569, "2": 0.008168279335018644}, "score": 4.664886629766153}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5791036510924621, "4": 0.3142975909558712, "3": 0.09267152752774177, "2": 0.00977805685753084, "1": 0.004114845463472364}, "score": 4.454547077198091}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6058352769967429, "5": 0.319009275441783, "3": 0.0721929271350774, "2": 0.002477960341848262, "1": 0.00047279262053485384}, "score": 4.2404448791878675}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5043339909147756, "4": 0.48087734567053736, "3": 0.014638424388165662, "2": 0.00011647673552087794, "1": 2.3370780791036495e-05}, "score": 4.48939758629321}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4952184503130441, "4": 0.4896058496700018, "3": 0.015104161154180824, "2": 4.834341692194041e-05, "1": 0}, "score": 4.480028736805592}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5661638245452201, "5": 0.33840993260878977, "3": 0.09406737482497846, "2": 0.0011024080009228933, "1": 0.00022870353502847792}, "score": 4.241458333211499}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6627762678301109, "5": 0.29506036985579265, "3": 0.04143576011883472, "2": 0.0006358352939117624, "1": 8.931429540240915e-05}, "score": 4.252085614529605}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5860211897945058, "4": 0.3889472922676274, "3": 0.02478492930112627, "2": 0.00019332748375293303, "1": 2.704498411487739e-05}, "score": 4.560783172159872}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9796907679694187, "4": 0.020088284390377298, "3": 0.00021137050848655723, "2": 5.374269463226712e-07, "1": 0}, "score": 4.979487176881945}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9765031850214607, "4": 0.02312814973735716, "3": 0.0003098082500781199, "2": 8.209735047000975e-07, "1": 0}, "score": 4.976248392393255}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9893855520838208, "4": 0.010537046429967632, "3": 5.128839754915444e-05, "1": 0, "2": 0}, "score": 4.989360098934253}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9924802383513751, "4": 0.007468654623553812, "3": 3.626926026890501e-05, "1": 0, "2": 0}, "score": 4.992458694959797}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6626722466309095, "3": 0.2912169083373441, "5": 0.031596213232011665, "2": 0.014269859405423309, "1": 0.00024435658147215893}, "score": 3.711106396213735}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7830470072431931, "3": 0.14517994586608185, "5": 0.06853263663175302, "2": 0.0031844617485024987, "1": 5.5236698372007655e-05}, "score": 3.9168179979635944}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7173456617943292, "5": 0.23523360376795255, "3": 0.047062785831292024, "2": 0.00034294708288620335, "1": 1.3445097721888264e-05}, "score": 4.187444880221774}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.49942410219314515, "4": 0.48416554288042823, "3": 0.016335036491272673, "2": 6.981553559272208e-05, "1": 4.151424622913124e-06}, "score": 4.482937633034927}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7405299725471765, "5": 0.19411397353043505, "3": 0.06467198304047687, "2": 0.000665301391287747, "1": 1.8404893088118716e-05}, "score": 4.128056219717101}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6913875905147415, "3": 0.17472415601370844, "5": 0.13123276505493323, "2": 0.0025653406555409593, "1": 6.529729152199933e-05}, "score": 3.9511808226760965}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5276679899345587, "3": 0.43963862339322635, "5": 0.030164284105247276, "2": 0.0025146528921628, "1": 1.2159144956206313e-05}, "score": 3.585458927974128}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5419095355785118, "4": 0.44921595412345033, "3": 0.008833340706149363, "2": 2.8331848426270784e-05, "1": 0}, "score": 4.533026374031358}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7032441571505315, "3": 0.18004740529784619, "5": 0.11441626884085616, "2": 0.00219123580453428, "1": 5.1447509658225e-05}, "score": 3.929828576944268}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.530399756074657, "3": 0.43158223812565694, "5": 0.03205948485767012, "2": 0.005876630650100186, "1": 6.256146778287308e-05}, "score": 3.5885283477652634}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6230910270706626, "3": 0.22337497889163194, "1": 0.12416621095480647, "4": 0.02757479908494084, "5": 0.001789339538717856}, "score": 2.159726966841281}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7797070396831141, "1": 0.16043278647176915, "3": 0.05729841597837574, "4": 0.0024799851666813715, "5": 7.554077358492543e-05}, "score": 1.90205161175357}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5424663625532608, "2": 0.2445133916481603, "4": 0.16274252960361513, "1": 0.0420296482089059, "5": 0.008240563924196512}, "score": 2.850649848653261}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4806925511700375, "4": 0.44807184102166076, "2": 0.04626037110748186, "5": 0.022431837775277803, "1": 0.0025206688399397855}, "score": 3.441643846387289}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6431854516992329, "3": 0.20374521740409382, "1": 0.12688865618787357, "4": 0.0245485251967065, "5": 0.0016279077135779299}, "score": 2.1308378897383333}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5808754017199257, "5": 0.3867752515496478, "3": 0.03214278725899479, "2": 0.00016367545888594875, "1": 2.7670712903641344e-05}, "score": 4.354227490203121}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7096894634825321, "4": 0.281969914473385, "3": 0.008292257755922218, "2": 3.513137331779058e-05, "1": 7.498294224672457e-06}, "score": 4.701308469835311}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5976122779158507, "5": 0.31812522003993304, "3": 0.08358011884769918, "2": 0.0005582581880490149, "1": 0.00010371705411314972}, "score": 4.233122191200834}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5205603247230391, "5": 0.4477080379594122, "3": 0.03156453496141151, "2": 0.00014425947069498173, "1": 1.695765845375995e-05}, "score": 4.415806558197227}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7945929087047048, "3": 0.10371270026817349, "5": 0.09968666123320008, "2": 0.0017303458104748375, "1": 0.0002729316937854879}, "score": 3.9916944372839493}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9736254816933227, "4": 0.02602981154284873, "3": 0.0002804475045697866, "2": 1.2192044525436348e-06, "1": 0}, "score": 4.973403959218785}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9926773148668234, "4": 0.007262493876292413, "3": 3.346531595833301e-05, "2": 3.913713799130119e-08, "1": 0}, "score": 4.992670262473109}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.971967720923079, "4": 0.027843715315370016, "3": 0.0001753120551007872, "2": 5.18701636806626e-07, "1": 0}, "score": 4.971803745446474}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972468249571347, "4": 0.0027236464224021572, "3": 2.1625097424008846e-05, "1": 0, "2": 0}, "score": 4.997233081514347}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9854825226961934, "4": 0.014252342497327077, "3": 0.00011225875935987729, "2": 1.6512765425774234e-07, "1": 0}, "score": 4.985520433413064}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4938543368260303, "4": 0.488422973286835, "3": 0.017486677039961842, "2": 8.277172834395787e-05, "1": 0}, "score": 4.476275101258768}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8053536912862517, "4": 0.19223851736508363, "3": 0.0023436845358647835, "2": 6.129048746954358e-06, "1": 0}, "score": 4.803044307366269}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9768416020024266, "4": 0.022751766232621387, "3": 0.00036146982192581707, "2": 1.0908427448990006e-06, "1": 0}, "score": 4.976520986849349}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.985659108404314, "4": 0.014238268136818697, "3": 8.262130342304252e-05, "2": 1.3723843807443188e-07, "1": 0}, "score": 4.985595791402612}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9194286081369202, "4": 0.07914786239751805, "3": 0.0014120439702390653, "2": 5.329124991293681e-06, "1": 0}, "score": 4.918011557535815}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5026302845087618, "4": 0.4921964074577053, "3": 0.005118358995479602, "2": 3.0060967155160094e-05, "1": 0}, "score": 4.497464184502865}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6687798140557839, "4": 0.3297038340720907, "3": 0.0015099591220678321, "2": 4.3267754203423055e-06, "1": 0}, "score": 4.6672625799304415}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8696083944416159, "4": 0.1295400732195737, "3": 0.0008419684624045242, "2": 4.546494779622782e-06, "1": 0}, "score": 4.8687616918986025}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5531010298629291, "4": 0.4410631131748149, "3": 0.0057940334873018366, "2": 3.4058872044452205e-05, "1": 0}, "score": 4.547243127757121}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5161028921434533, "4": 0.48197554631733563, "3": 0.0018646628867496505, "2": 4.37129173938075e-06, "1": 0}, "score": 4.514256499209863}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7123361202226379, "3": 0.23843894434033214, "5": 0.03578188926613499, "2": 0.01176325840070422, "1": 0.0016665594288103789}, "score": 3.768813691626554}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8198187743825499, "3": 0.09581392975833701, "5": 0.08333037086832515, "2": 0.0009595136657919179, "1": 7.48379087420482e-05}, "score": 3.9853728624104643}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7712368300643053, "5": 0.18864604453614148, "3": 0.03979658398093767, "2": 0.00027848356859398943, "1": 3.905814986988322e-05}, "score": 4.148175763451267}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7403659040936746, "5": 0.1595434468190282, "3": 0.09907865988874869, "2": 0.0009112898905150718, "1": 9.304121415702185e-05}, "score": 4.0583635304601735}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7597271297307134, "5": 0.14363995829043405, "3": 0.09472389381524757, "2": 0.001642324602857754, "1": 0.0002616271916936357}, "score": 4.0448467609046315}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4398376488702421, "2": 0.25103005650188326, "4": 0.16455482197684354, "1": 0.1301974154524911, "5": 0.014225658618091136}, "score": 2.681532080811519}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6709919896568293, "5": 0.2869478462841298, "3": 0.041351846629371886, "2": 0.0005700961084689151, "1": 0.00010486329588756933}, "score": 4.244149361890752}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5133159687115584, "3": 0.42101982758808654, "5": 0.03354497846301951, "2": 0.029585500075146536, "1": 0.0025115630263161533}, "score": 3.545809395811809}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.45682604777112895, "5": 0.4192151526667, "3": 0.11442488471028327, "2": 0.007427239675347977, "1": 0.002103020572196711}, "score": 4.283627763436387}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5420465476266993, "3": 0.30199947500585106, "5": 0.12044691048763864, "2": 0.030219638031164377, "1": 0.0052468604016314355}, "score": 3.7422571219862744}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6226878992530698, "4": 0.22114711946654425, "2": 0.12221339779469699, "1": 0.02046157381219094, "5": 0.013370890309440546}, "score": 3.084762451515667}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5095145343670177, "2": 0.3026822510866933, "3": 0.17446415044876804, "4": 0.01147892308979572, "5": 0.001831479809189004}, "score": 1.6933931139680758}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5591589495513853, "4": 0.18745705496350926, "2": 0.15205423691080516, "1": 0.08352251857086235, "5": 0.017780729864357577}, "score": 2.9039166934578753}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4300828562083562, "3": 0.3349859125938285, "5": 0.20790467450071834, "2": 0.02047785337455368, "1": 0.00646003204935157}, "score": 3.8125663390283706}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3383321411077587, "3": 0.30877022102072516, "1": 0.30658246682746376, "4": 0.043838888071351154, "5": 0.0024747027281837334}, "score": 2.097289792262176}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"3": 0.48608513282518445, "4": 0.2544116129931638, "2": 0.21067097979553295, "1": 0.036945268175178986, "5": 0.011872960395281927}, "score": 2.9935959276874176}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7532473794265114, "5": 0.1344519759276529, "3": 0.10518451345698374, "2": 0.006565900590873897, "1": 0.0005489613607934522}, "score": 4.014488795596259}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7420035139828702, "3": 0.1642674149738263, "5": 0.08287658545337283, "2": 0.01015304518768252, "1": 0.000693598496622202}, "score": 3.8962216783511536}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7409844567143842, "5": 0.13192548808255963, "3": 0.11928709838814522, "2": 0.007177041702325129, "1": 0.0006225618357628293}, "score": 3.996416608766373}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6001302583969232, "3": 0.2933986835973264, "5": 0.05230773615586412, "2": 0.0499516220970221, "1": 0.0042082642856235844}, "score": 3.6463798006570123}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8860341102186615, "4": 0.10367440623939209, "3": 0.009689536374431608, "2": 9.345897387950677e-05, "1": 0}, "score": 4.876603398375046}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9094125203336489, "4": 0.08064509456543012, "3": 0.009587692828507619, "2": 0.00021157754154050958, "1": 0.00010909145399989393}, "score": 4.899104988558025}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5134539152446379, "4": 0.41092572441602604, "3": 0.0743616148288784, "2": 0.0009718850712008255, "1": 0.00019132213115446414}, "score": 4.436616277460333}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9388113971061265, "4": 0.06017209333566319, "3": 0.0009658398734171549, "2": 3.2391552093921054e-06, "1": 0}, "score": 4.937883563236382}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6560563594058442, "4": 0.3218619989472803, "3": 0.02161620098140732, "2": 0.00016096558074941937, "1": 0}, "score": 4.634311359267789}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7526502157664394, "5": 0.2070417945620916, "3": 0.040040845835320006, "2": 0.00022454082921285077, "1": 0}, "score": 4.166558962981001}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8633999964261801, "4": 0.133329642790045, "3": 0.0032428574786553194, "2": 2.4091029660824625e-05, "1": 2.047215460719202e-06}, "score": 4.8601039893353715}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9092924494317195, "4": 0.088463043655062, "3": 0.00222762629975499, "2": 1.485630802621772e-05, "1": 1.0627379587998736e-06}, "score": 4.907032794475273}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5839436736703727, "4": 0.41107204001654973, "3": 0.00496515382545589, "2": 1.0934189788458807e-05, "1": 0}, "score": 4.5789613979633135}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.508671222206972, "5": 0.48152674698157555, "3": 0.009746337554275267, "2": 3.843119724333144e-05, "1": 0}, "score": 4.471711689748274}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6611027400289041, "4": 0.2375006544339189, "3": 0.059618866678226315, "1": 0.02689776180798846, "2": 0.014800904281163306}, "score": 4.491227622093066}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9818821647407698, "4": 0.0162622631407463, "3": 0.0015013073256803047, "1": 0.0002320780083330593, "2": 0}, "score": 4.979804342532114}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.5229100752234358, "5": 0.29418772352985945, "4": 0.07108745495536438, "3": 0.06323638066594266, "2": 0.04833967630227051}, "score": 2.565199292979487}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9613525162059738, "4": 0.03571132191495586, "3": 0.0027749570760318546, "1": 7.818646556566585e-05, "2": 7.1537626637873e-05}, "score": 4.958210925422523}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.907688391906987, "4": 0.09051671945323157, "3": 0.001669460097057124, "2": 8.990932396580246e-06, "1": 0}, "score": 4.906106454815438}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8481810361069034, "4": 0.14661621332153257, "3": 0.005187985538615106, "2": 1.2161236509007177e-05, "1": 1.4672935156238446e-06}, "score": 4.842965284247233}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9285457652116691, "4": 0.07097033543661178, "3": 0.0004802050777467002, "2": 3.387169615461425e-07, "1": 0}, "score": 4.928067996885072}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8778821323270027, "4": 0.12066743360525731, "3": 0.0014465198657137171, "2": 2.551610065006635e-06, "1": 0}, "score": 4.876431703459953}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7462533911731666, "4": 0.24543108106960299, "3": 0.008284276155460707, "2": 2.4915561247364387e-05, "1": 5.292721410744855e-06}, "score": 4.737904175600509}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.864605504708368, "4": 0.13324816328615513, "3": 0.002138373041659576, "2": 3.953718616548164e-06, "1": 0}, "score": 4.86246267860398}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7324363031712341, "3": 0.1328219193783645, "1": 0.11928765903882521, "4": 0.01442466053452593, "5": 0.0010281425029598189}, "score": 2.04546806872499}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5346185911865095, "4": 0.2823385489246633, "2": 0.1519144721082477, "5": 0.023143423983287552, "1": 0.007984191937451302}, "score": 3.160742664978896}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5524632575353832, "5": 0.3417040388703358, "3": 0.10181798709021636, "2": 0.0032754434974321626, "1": 0.0006658402373896034}, "score": 4.231354633084471}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.44441754135487166, "4": 0.28665198351815574, "3": 0.18742241610048152, "2": 0.061205421915346774, "1": 0.020260315656532996}, "score": 4.073806458050763}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4902971221067689, "1": 0.3970971173999848, "3": 0.09444123403333247, "4": 0.01451727441022733, "5": 0.003639643651737904}, "score": 1.73729559764938}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7246346950562347, "4": 0.2698563766085724, "3": 0.005475083786096758, "2": 1.5495080058603925e-05, "1": 0}, "score": 4.7191418169805255}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.717530782377747, "4": 0.27583086750442054, "3": 0.006546259245737419, "2": 4.194774000677097e-05, "1": 0}, "score": 4.710936276223602}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9141044190647545, "4": 0.0848438475206355, "3": 0.0010366053407932635, "2": 3.825801768391747e-06, "1": 0}, "score": 4.913070481891411}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9771975546563643, "4": 0.022607587476491196, "3": 0.00018598602899542744, "2": 3.1861001677274956e-07, "1": 0}, "score": 4.977019288076196}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.703357508145484, "4": 0.2896136168691984, "3": 0.006949952875027552, "2": 1.696697076424639e-05, "1": 0}, "score": 4.696416767926954}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5326612555060835, "5": 0.42699752586391776, "3": 0.03956966458967224, "2": 0.0005934113637826301, "1": 0.0001079507989412798}, "score": 4.38594427630326}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.923259514370592, "4": 0.0754937505745592, "3": 0.001232579686224367, "2": 7.359239200969272e-06, "1": 3.5253141679920337e-06}, "score": 4.922004655970356}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9746181165913641, "4": 0.025159387289752064, "3": 0.00021746894483450508, "2": 1.3499081565681102e-06, "1": 0}, "score": 4.97440153096373}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9961277545526345, "4": 0.003767769866133999, "3": 5.502769246948142e-05, "2": 2.2974783477971665e-07, "1": 0}, "score": 4.996121294602753}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9718348464673844, "4": 0.027296958315860643, "3": 0.0007207714220503793, "2": 5.056373657867993e-06, "1": 0}, "score": 4.971242235550305}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4361991560474286, "4": 0.2693605667688694, "2": 0.24473034676974045, "1": 0.02953958649839693, "5": 0.020169931967027793}, "score": 3.0058909133631437}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4142157523340835, "3": 0.3429073448297587, "5": 0.11351103751053358, "2": 0.10429957414140469, "1": 0.025065246346714674}, "score": 3.4868082691558535}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5241382204290626, "2": 0.2610049255495913, "4": 0.17540229758737522, "1": 0.02891871545104925, "5": 0.010535334299037167}, "score": 2.87763054773113}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6162050114637974, "5": 0.23682170986535872, "3": 0.13713145330737847, "2": 0.008692723348679378, "1": 0.0011478593569012026}, "score": 4.078861329787571}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6431095152759457, "1": 0.2656041862554809, "3": 0.08240409060782926, "4": 0.008205431220512054, "5": 0.0006767028521111586}, "score": 1.8352408631924386}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5330291104920087, "4": 0.32515870264792857, "3": 0.10386433526565865, "2": 0.019863468263256977, "1": 0.018033744169766972}, "score": 4.335353588215008}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.573204289287767, "5": 0.36252907536516, "3": 0.060986765339253006, "2": 0.002740569591710325, "1": 0.0005000982394207611}, "score": 4.294572424004438}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8347318946010543, "4": 0.15479792845340473, "3": 0.010078810794851028, "2": 0.00030179728732228383, "1": 7.303578729682103e-05}, "score": 4.823844002545233}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8315783146481147, "4": 0.1600000421997352, "3": 0.008147378988138896, "2": 0.00018096733727988236, "1": 5.0879320193422386e-05}, "score": 4.822951270565737}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5655931927054773, "5": 0.37755904950348396, "3": 0.05409209078652161, "2": 0.0023589782467153147, "1": 0.00037193836607949695}, "score": 4.317641048865681}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6697944933436738, "3": 0.2615888192977395, "5": 0.06005600112373401, "2": 0.007939658616900509, "1": 0.0006065314354550091}, "score": 3.7807650922165963}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7757203014868147, "4": 0.22230270274249445, "3": 0.0019619762949432554, "2": 2.7948838739558622e-06, "1": 0}, "score": 4.773762194351157}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6884609706013277, "3": 0.2931072781342189, "5": 0.014952466641690972, "2": 0.0033914985673565634, "1": 6.563365237690877e-05}, "score": 3.7148589738566975}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6113796709978077, "5": 0.3749255147777748, "3": 0.01363567989465486, "2": 5.1098572324504986e-05, "1": 0}, "score": 4.361190540178041}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6680651501744365, "5": 0.3097962982217208, "3": 0.022082182883112682, "2": 4.875450278330687e-05, "1": 0}, "score": 4.287618796325242}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8318083859781447, "5": 0.13940634014758244, "3": 0.028694586434049155, "2": 7.542845250144175e-05, "1": 7.71538631630245e-06}, "score": 4.110538584508603}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7486091954934162, "5": 0.1818117987008537, "3": 0.06925005774861628, "2": 0.00030432145422923233, "1": 1.9663331536446887e-05}, "score": 4.1118946634127465}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6100586554268835, "5": 0.36904942530326773, "3": 0.020832737735761567, "2": 4.621791798001036e-05, "1": 0}, "score": 4.348128764739209}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7151856640475316, "4": 0.28052944114739414, "3": 0.004078406216882875, "2": 5.6461142091939005e-06, "1": 0}, "score": 4.711238812564938}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8553442410195466, "4": 0.14339894613097545, "3": 0.0011752093230215136, "2": 6.361165726956224e-07, "1": 0}, "score": 4.854236924814609}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7893424830592161, "3": 0.1252107451646507, "5": 0.08355898410824306, "2": 0.0017799820482176194, "1": 0}, "score": 3.9547834002436013}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6892752677328138, "4": 0.24574899733095257, "2": 0.060764514711949665, "5": 0.002964974046082303, "1": 0.0012413621428238833}, "score": 3.1884326267371357}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5966596671009395, "3": 0.385769206098378, "2": 0.010634163380967575, "5": 0.0067175350484772415, "1": 0.00019917574146972316}, "score": 3.5990743551651048}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6415050261250047, "3": 0.3189922089020808, "5": 0.028230204293252747, "2": 0.011077270198434585, "1": 0.00019113491844363875}, "score": 3.6865087475063896}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.6581250895668022, "4": 0.2186779017656998, "2": 0.11847703910599487, "1": 0.0026018391984854315, "5": 0.0021120716257622347}, "score": 3.0992219286738543}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5036862120210344, "5": 0.45927328680968227, "3": 0.03660275749570988, "2": 0.0004013562985901702, "1": 2.3027474763808594e-05}, "score": 4.4218043695567895}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5644248674493766, "5": 0.41496647298621, "3": 0.02043227950537776, "2": 4.9264293948431833e-05, "1": 0}, "score": 4.394485810258523}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8483057363668896, "4": 0.14818981398907233, "3": 0.0034850774890337003, "2": 1.3442274547810331e-05, "1": 3.957064877766675e-06}, "score": 4.844783569736315}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8925474780933412, "4": 0.10575550559995794, "3": 0.0016801570630939598, "2": 7.105943581180785e-06, "1": 0}, "score": 4.890861797985481}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5304368535308798, "5": 0.4660331546825035, "3": 0.003518390282768852, "2": 5.992798857249481e-06, "1": 0}, "score": 4.462505372858214}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4896331067863477, "5": 0.3506412001977461, "3": 0.1425832556080347, "2": 0.012049838760576722, "1": 0.00508171030419299}, "score": 4.168714973182493}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5429240499552795, "5": 0.33361928547220787, "3": 0.11030212359575405, "2": 0.008770629468273871, "1": 0.00436842389364378}, "score": 4.192673615313718}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8066124108809584, "4": 0.1623599654191811, "3": 0.028364367132955527, "1": 0.0013643201950575736, "2": 0.0012924667205977823}, "score": 4.771575141543713}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6033396643787434, "4": 0.34891323430341686, "3": 0.04330002788406988, "2": 0.0026169483289812264, "1": 0.0018210518596074}, "score": 4.5493475686230695}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9759769233082062, "4": 0.02342397051396316, "3": 0.0005805692907727647, "2": 8.759357503982788e-06, "1": 6.733685106838479e-06}, "score": 4.975361603096103}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5013629445288746, "3": 0.4482562784562026, "5": 0.02520010292872214, "2": 0.024459274740519774, "1": 0.0007167711108925599}, "score": 3.52587276728665}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6690425289150077, "5": 0.1943433186891137, "3": 0.133110256226775, "2": 0.003075860436860161, "1": 0.00031681200632151067}, "score": 4.054136926880371}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.808698737523533, "5": 0.1119281087438302, "3": 0.0782631040253177, "2": 0.0009355948759707081, "1": 0}, "score": 4.0317993625189965}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.456466589507047, "3": 0.44047589368303214, "5": 0.07498490892691062, "2": 0.025215199790670214, "1": 0.002818763402379935}, "score": 3.5756059248779444}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.593061426111959, "3": 0.331523162500752, "5": 0.06554478693533615, "2": 0.009466500267635666, "1": 0.00037514250156643673}, "score": 3.713954906326456}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"4": 0.829601204635508, "5": 0.09695832810027806, "3": 0.07291934585013267, "2": 0.0004947299993843013, "1": 1.4295925376606544e-05}, "score": 4.023006912755114}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5348741999587262, "5": 0.4597643055726319, "3": 0.005320824534233774, "2": 1.875924238118357e-05, "1": 0}, "score": 4.454415919120891}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8141542619007037, "5": 0.10370056659207601, "3": 0.08132070669192297, "2": 0.0007908367466946474, "1": 2.5772590873373372e-05}, "score": 4.020721031407745}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6727651702631525, "5": 0.30855881670002167, "3": 0.01859519062957403, "2": 6.827956710876918e-05, "1": 0}, "score": 4.289830702236396}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8749790462973513, "5": 0.0728463391129235, "3": 0.051876768990033864, "2": 0.0002856920715714726, "1": 0}, "score": 4.020398433892686}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6867985027493473, "3": 0.2081657170301133, "5": 0.10337668767663351, "2": 0.001552011418449166, "1": 0.00010524948273980879}, "score": 3.891791001161177}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6892705255352849, "5": 0.21141790751084638, "3": 0.09843067359236113, "2": 0.0008041349939150524, "1": 6.537726434020246e-05}, "score": 4.111184097535329}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.665249134593029, "5": 0.25541604866120315, "3": 0.07887588010168506, "2": 0.0004074529875150462, "1": 4.345120385336437e-05}, "score": 4.17559631944206}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5024954770424309, "4": 0.47890688262477543, "3": 0.018545594711348173, "2": 4.086294074178546e-05, "1": 6.632757020553046e-06}, "score": 4.483850459661203}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6006314683201635, "5": 0.3416868515894444, "3": 0.057404085628086694, "2": 0.00025191017056849313, "1": 2.4737159788382386e-05}, "score": 4.2837050028469275}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.45042753476497926, "4": 0.3272123926904404, "2": 0.15071440359208668, "5": 0.04373358222657553, "1": 0.027898883747650087}, "score": 3.2081701345219673}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6613763741785198, "3": 0.2307082162505255, "5": 0.10077205438767478, "2": 0.006642822702682495, "1": 0.00046235341120343256}, "score": 3.855385611255391}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4999573420997726, "4": 0.43712147398850787, "2": 0.03621284821697018, "5": 0.025369135034006347, "1": 0.0013277161410298855}, "score": 3.4489966200680247}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.45815253704513914, "3": 0.4516624816946828, "2": 0.05109264630775152, "5": 0.03698473570400053, "1": 0.0020931691955781632}, "score": 3.4768499047235575}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5085968904261142, "4": 0.4341191688365203, "2": 0.03190678805932303, "5": 0.024385148500715825, "1": 0.0009847672885342908}, "score": 3.449016392683261}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.45042753476497926, "4": 0.3272123926904404, "2": 0.15071440359208668, "5": 0.04373358222657553, "1": 0.027898883747650087}, "score": 3.2081701345219673}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.48845142963818416, "3": 0.4519884918422618, "5": 0.03743885163444739, "2": 0.021223411299966206, "1": 0.0008878879547645923}, "score": 3.54033530994682}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.645559613835494, "3": 0.28175958700614245, "5": 0.05913304936242979, "2": 0.013151453423027423, "1": 0.00039212131069103263}, "score": 3.7498931473664894}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5276365946231774, "2": 0.25279992838415527, "4": 0.200845102970519, "1": 0.010971360415851363, "5": 0.0077437075069607866}, "score": 2.941589675658248}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5076236613822921, "4": 0.4687682636515, "2": 0.01318388537636352, "5": 0.010211449379749772, "1": 0.00020293476200625973}, "score": 3.475606071041263}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6775395510490697, "4": 0.32018622478624903, "3": 0.002262947753207588, "2": 3.891976234121447e-06, "1": 0}, "score": 4.6752738058590815}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8411017831454515, "4": 0.15825554168885875, "3": 0.0006330445874443804, "2": 1.2914667112552014e-06, "1": 0}, "score": 4.840473164424044}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7776385277964399, "4": 0.22145415191925458, "3": 0.0009028720580708107, "2": 1.7122333276775836e-06, "1": 0}, "score": 4.776734356411403}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7806403457569377, "4": 0.21632001863110978, "3": 0.0030107363367166615, "2": 2.1330768437351637e-05, "1": 3.3101137619391598e-06}, "score": 4.777580328784718}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5670715118585096, "5": 0.423975545975291, "3": 0.008922028035431092, "2": 2.5648973670347e-05, "1": 0}, "score": 4.415004405055908}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7446050763602096, "2": 0.18935682138737925, "3": 0.05751027796125157, "4": 0.007253936441611271, "5": 0.0012698696773968438}, "score": 1.3312199962432687}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7846538530312508, "2": 0.20017423834026607, "3": 0.013941071659868314, "4": 0.0011021919501283822, "5": 0.00012832942081053239}, "score": 1.2318763483732666}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.7570575535250703, "2": 0.22866576113116366, "3": 0.013254966057184882, "4": 0.0009198796607585779, "5": 0.00010155835485586379}, "score": 1.258341638311235}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9374538022047697, "2": 0.05912669290128921, "3": 0.0031716510205631924, "4": 0.00019036276818030216, "5": 5.736610123002084e-05}, "score": 1.066270555935959}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.992661449627689, "2": 0.007002645309194788, "3": 0.00032524981804598295, "4": 5.9328461633849765e-06, "5": 4.512920739415918e-06}, "score": 1.0076889967774116}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7310295178148034, "3": 0.21783743617261464, "5": 0.04636893723861644, "2": 0.004632878026518781, "1": 0.0001038608017553604}, "score": 3.8189492072573334}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.545526770365121, "3": 0.42743164419928825, "5": 0.016710577112789126, "2": 0.010120486936757331, "1": 0.00019911798887922738}, "score": 3.568435683774048}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5501264599516535, "4": 0.41887671442732655, "2": 0.02257902728043723, "5": 0.008139053364645384, "1": 0.00026944695889257744}, "score": 3.412040731120136}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6201839632715892, "4": 0.2309665232403171, "2": 0.1365250861396458, "5": 0.0066218665008792865, "1": 0.005694573927901751}, "score": 3.0962967913613633}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.6330195580005679, "4": 0.18960420711164247, "2": 0.17049258038652904, "1": 0.0045785496560086575, "5": 0.002300694143633929}, "score": 3.014555979902448}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7214876990841255, "4": 0.2720341960000205, "3": 0.0064146278183636815, "2": 2.890589512741918e-05, "1": 0}, "score": 4.715039979267328}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5164247464859043, "5": 0.45435799337752175, "3": 0.02891507481395688, "2": 0.000226484963852936, "1": 0}, "score": 4.42502212296305}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5827407932440979, "5": 0.3948289562555591, "3": 0.022299719033278247, "2": 0.0001070208374434576, "1": 1.2800068954281129e-05}, "score": 4.372280782676439}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8073569025930736, "4": 0.186699071811021, "3": 0.005863327522191118, "2": 2.5562528736388216e-05, "1": 0}, "score": 4.801486640416121}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.554131475496549, "5": 0.4204833063001967, "3": 0.023183487486338934, "2": 0.0009763841037959563, "1": 0}, "score": 4.395832082107441}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6167077192727691, "3": 0.3573140471514485, "5": 0.013481993482140674, "2": 0.012065972235726339, "1": 0.0004127362866767688}, "score": 3.6307913201909368}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5659574727986384, "3": 0.3884249137712413, "2": 0.02902682141647985, "5": 0.015682105401795574, "1": 0.0008947363178722666}, "score": 3.5665132925769756}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7330244878100219, "3": 0.2003679204860709, "5": 0.05986238107209209, "2": 0.006505859803267497, "1": 0.0002314849956836556}, "score": 3.8457870729793258}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4749348225721508, "4": 0.4404308176866507, "2": 0.06064226419724563, "5": 0.020853255580014704, "1": 0.0031258000892609114}, "score": 3.4152488792642584}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7642767478509651, "5": 0.17366795630221313, "3": 0.061402667509046056, "2": 0.0006235715774465586, "1": 2.363029459150405e-05}, "score": 4.110947856809243}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"3": 0.510050519666548, "2": 0.3413700839582926, "4": 0.12842782571869082, "1": 0.017514597550780706, "5": 0.0026368137595151847}, "score": 2.757302135504891}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5255101520565882, "3": 0.3491277073759989, "1": 0.07315769223781382, "4": 0.050626739178617146, "5": 0.0015777397407138619}, "score": 2.3819567010336073}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4814574121222399, "4": 0.4156110217571826, "2": 0.06751538372726036, "5": 0.026518899805203566, "1": 0.008897099092842283}, "score": 3.3833393097955953}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5445772899686752, "4": 0.32693948054476063, "2": 0.10434714559267975, "1": 0.012450851062176489, "5": 0.011683605022707655}, "score": 3.2210582027136754}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4911625730416342, "2": 0.43164430411393695, "4": 0.051424889099181824, "1": 0.024915118277983834, "5": 0.0008527211235304505}, "score": 2.5716556217614173}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6293956536000496, "5": 0.24784956738205768, "3": 0.117251474035902, "2": 0.0045375593481255415, "1": 0.0009468757283995356}, "score": 4.118684587031644}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8347584895828721, "4": 0.16050291092053343, "3": 0.004657730344633686, "2": 1.218306116602592e-05, "1": 0}, "score": 4.8301334117347965}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5259693909752045, "4": 0.4634904492063836, "3": 0.010478709992336785, "2": 1.2525362115426179e-05, "1": 0}, "score": 4.515490850372168}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7860902509916581, "4": 0.21065121978438717, "3": 0.0032423594139989425, "2": 5.239015285004886e-06, "1": 0}, "score": 4.782845970675654}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.69634782146062, "5": 0.288774463112154, "3": 0.014861482205747045, "2": 1.2761164786567835e-05, "1": 0}, "score": 4.273888409532919}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6965557401737209, "4": 0.25279310287823364, "3": 0.042922041376091694, "1": 0.004064055143595118, "2": 0.0036372804707122115}, "score": 4.634184590046471}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5401856511948505, "4": 0.4217591341731796, "3": 0.03578083729405464, "2": 0.0017007764447236214, "1": 0.0005592052380759141}, "score": 4.499332833520381}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5497877963628363, "5": 0.42011300263515694, "3": 0.029190195401903384, "2": 0.0007481518444425382, "1": 0.00014535987410032206}, "score": 4.388996450987007}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6108355224963893, "4": 0.33596002476855474, "3": 0.04821995208039159, "2": 0.003321077501711488, "1": 0.001644152870087357}, "score": 4.55105157572205}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8413068603460341, "4": 0.15325193160058442, "3": 0.0053255994550728165, "2": 5.765151686347193e-05, "1": 0}, "score": 4.835914405016486}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9365307992737179, "4": 0.06216282044486327, "3": 0.0012819704124014857, "2": 1.0933227622093364e-05, "1": 7.326416814426583e-06}, "score": 4.935210734911678}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7746078869410424, "4": 0.214316196656544, "3": 0.010913132483000137, "2": 0.00011339865810838821, "1": 3.599771837459991e-05}, "score": 4.763370183637807}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7452075267478161, "4": 0.22582358090801619, "3": 0.028745530060010464, "2": 0.00019631922983847914, "1": 2.105730557188088e-05}, "score": 4.7160104721702}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9037346097287003, "4": 0.09430421429918541, "3": 0.0019348729762576995, "2": 1.4865373138691924e-05, "1": 6.852047810013251e-06}, "score": 4.901753584921347}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8233905388971462, "4": 0.16924283532351714, "3": 0.007271186469470697, "2": 6.554458236920449e-05, "1": 2.262242244389404e-05}, "score": 4.815926329660775}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"4": 0.570992159839044, "3": 0.20979842294351084, "5": 0.19820700789838333, "2": 0.01499469210754458, "1": 0.005995362651531821}, "score": 3.9404323768534155}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5794381800369035, "4": 0.3420417066793245, "3": 0.07368753689420182, "2": 0.0033937831716317484, "1": 0.0014158078387742213}, "score": 4.494727024771363}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4866591199598079, "4": 0.41078315792637016, "3": 0.0915658402399346, "2": 0.007391415645897705, "1": 0.003531145346140071}, "score": 4.369742643275747}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8818674038922198, "4": 0.06838053984657072, "3": 0.02857895989213699, "1": 0.0175150109001604, "2": 0.00360301602335553}, "score": 4.793581081323043}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5254032583994124, "4": 0.23225857048231185, "3": 0.17445935275059934, "2": 0.037249401552139474, "1": 0.03061400178518265}, "score": 4.1846059428952}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"5": 0.678280018275041, "4": 0.3023797503642712, "3": 0.019149719710308735, "2": 0.00017173671167760291, "1": 1.49818513409224e-05}, "score": 4.658744378262328}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9713463462712701, "4": 0.028529937626547642, "3": 0.00012231681927408835, "2": 2.0159945583177263e-07, "1": 0}, "score": 4.971224789472943}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8655495464167763, "4": 0.13315372382113166, "3": 0.0012686955910439042, "2": 2.3806523766629646e-06, "1": 0}, "score": 4.864298261812576}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9936063254793587, "4": 0.006296253531595408, "3": 6.912936179527685e-05, "2": 2.700377696874816e-07, "1": 0}, "score": 4.99356449729849}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9290932820133158, "4": 0.07018218325144265, "3": 0.000715570808644956, "2": 2.0952346627578218e-06, "1": 0}, "score": 4.928379897490859}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8174597033204668, "4": 0.18095767768543017, "3": 0.0015692021084238491, "2": 7.2839591812988494e-06, "1": 0}, "score": 4.8158809370314986}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7741326636617074, "4": 0.22271347480852077, "3": 0.0031326953838584637, "2": 1.1178078214044872e-05, "1": 0}, "score": 4.770985312774919}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9919868329710713, "4": 0.007946843286896672, "3": 4.634245789058983e-05, "1": 0, "2": 0}, "score": 4.991960311154015}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9922947346339439, "4": 0.007649591739143549, "3": 5.429116779300657e-05, "2": 1.3944786962090087e-07, "1": 0}, "score": 4.992241397937631}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9160708776081518, "4": 0.08322577362333486, "3": 0.0006776531358341546, "2": 1.7463633813634427e-06, "1": 0}, "score": 4.915411655185804}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9240379285210056, "4": 0.07501175082888736, "3": 0.0009449538194230729, "2": 1.4938124718232845e-06, "1": 0}, "score": 4.923093562234817}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8094089573073401, "4": 0.18515817855653743, "3": 0.005416455198031554, "2": 1.2542207519685285e-05, "1": 0}, "score": 4.803970526431683}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.76714985392769, "4": 0.22880499235068694, "3": 0.004019555317528506, "2": 2.642939006454024e-06, "1": 0}, "score": 4.763142531023877}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9307970470919475, "4": 0.06834003637704937, "3": 0.0008352356143854516, "2": 1.3449375193558666e-06, "1": 0}, "score": 4.929983613631534}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9580264804547745, "4": 0.04148856217391842, "3": 0.00045964252047725067, "2": 6.508959750864209e-07, "1": 0}, "score": 4.957589154078013}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8585670245476187, "4": 0.13662665761087792, "3": 0.004769406525293186, "2": 2.5528680815012402e-05, "1": 8.844630555183932e-06}, "score": 4.85372219352009}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9341810087610176, "4": 0.06501685077446506, "3": 0.0007798932551637043, "2": 2.8358410446537183e-06, "1": 0}, "score": 4.933413562658214}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.972330490023366, "4": 0.026283962938180343, "3": 0.0013088710594501148, "2": 7.499231570033397e-06, "1": 0}, "score": 4.971073796227516}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9364073351920726, "4": 0.061107724310575894, "3": 0.002446659877234372, "2": 1.719821428799484e-05, "1": 0}, "score": 4.933945968714197}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9875456030197219, "4": 0.011763538369585774, "3": 0.0006660552053121889, "1": 8.56992994357514e-06, "2": 0}, "score": 4.986869858352184}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5361563514399345, "4": 0.38850466559228286, "2": 0.05402334559556273, "5": 0.01963602086888349, "1": 0.001665466191243668}, "score": 3.3704276710191525}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6297146302969967, "3": 0.30554335363905977, "5": 0.0422349416229364, "2": 0.02107886920024418, "1": 0.0014270288834678803}, "score": 3.6902523985591342}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6121018125073652, "4": 0.3696686555895394, "3": 0.018118550066029367, "2": 0.00010258313653435441, "1": 7.233561809630167e-06}, "score": 4.593757087292212}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7012311521576391, "5": 0.23491794406616756, "3": 0.06279919651104153, "2": 0.0009383354971874752, "1": 8.609923771965806e-05}, "score": 4.169988414861779}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.46616356900329625, "4": 0.393977254912123, "2": 0.09698681864212955, "5": 0.033329429617341345, "1": 0.00954066585343518}, "score": 3.3445687432025433}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6770992595851477, "5": 0.2945966931198926, "3": 0.028240758716116306, "2": 5.369009629470114e-05, "1": 0}, "score": 4.266251109817818}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7588879279491135, "3": 0.1314846715918616, "5": 0.10751296865924823, "2": 0.0020061729034725603, "1": 0.00010543593928962576}, "score": 3.971699563551657}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8072781891324143, "5": 0.14056353303452057, "3": 0.05202185293138362, "2": 0.00012998402495775652, "1": 5.920000645684723e-06}, "score": 4.088263998025889}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8911284571656601, "4": 0.10771055455922947, "3": 0.001155330764287117, "2": 8.449182160609198e-07, "1": 0}, "score": 4.88997571965551}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.756586431849836, "5": 0.21113771092133163, "3": 0.032149843375178566, "2": 0.00010924494446272763, "1": 0}, "score": 4.178772375474958}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5515815178831868, "5": 0.415372010269187, "3": 0.03250839224685847, "2": 0.0004557770925930508, "1": 4.216652070551875e-05}, "score": 4.381840889836196}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4964372441306115, "5": 0.49577487814359844, "3": 0.007701613705013378, "2": 5.071909961819848e-05, "1": 0}, "score": 4.487989171775986}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8857184636422047, "5": 0.09136418740564067, "3": 0.022752585310949085, "2": 0.00012797162478330964, "1": 0}, "score": 4.068358173880181}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9229108004948157, "4": 0.07618663693312906, "3": 0.0008806295575203329, "2": 5.688266577002027e-06, "1": 0}, "score": 4.922033772610387}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8978469226192185, "4": 0.10052680204728619, "3": 0.0016057381846561664, "2": 8.629594855769182e-06, "1": 0}, "score": 4.896234597206699}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"5": 0.749684468230989, "4": 0.24739139533611582, "3": 0.002896688763604583, "2": 1.9851479889159623e-05, "1": 3.896109760374896e-06}, "score": 4.746739151172655}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.881946872544391, "4": 0.1152418287310817, "3": 0.002765659929422645, "2": 2.230642063695043e-05, "1": 0}, "score": 4.879157112596661}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8249653694110066, "4": 0.17255380122141764, "3": 0.0023736106550850296, "2": 1.5592788909032108e-05, "1": 0}, "score": 4.8226359479566066}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7585430841703907, "4": 0.23673384163378647, "3": 0.004678790699433157, "2": 2.5875887692776604e-05, "1": 8.431684363813304e-06}, "score": 4.7537947664420335}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9295005259304321, "4": 0.06935656305508026, "3": 0.0011324475671513374, "2": 4.81642792040662e-06, "1": 0}, "score": 4.928363687995211}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6177229827468798, "3": 0.30872881771024036, "5": 0.05563908817508397, "2": 0.01705163134109526, "1": 0.0008380158027190755}, "score": 3.710287321342028}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5216195125705967, "3": 0.41612366136420936, "5": 0.03347040042940576, "2": 0.02805928179406902, "1": 0.000711311079454991}, "score": 3.5590872613721234}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5158087096324309, "3": 0.4481560416309882, "2": 0.019161529152396627, "5": 0.016448351821702595, "1": 0.00041219443101278265}, "score": 3.5287264603503328}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6698150831428628, "3": 0.2828137288478391, "5": 0.0445298468014124, "2": 0.0027797888705748714, "1": 4.2705023426524425e-05}, "score": 3.7560238268466293}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4802280421913881, "4": 0.46617084121169583, "2": 0.03084786305227384, "5": 0.02194428144121573, "1": 0.0007976695053472367}, "score": 3.4776216003961427}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8229302769986375, "4": 0.17445432839359123, "3": 0.0024571026689787045, "2": 3.500642296589791e-05, "1": 0}, "score": 4.820504317781783}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9683113944062332, "4": 0.03137774799084455, "3": 0.0002909139613425379, "2": 2.439798753827999e-06, "1": 0}, "score": 4.968032545136904}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7920614910237909, "4": 0.20405783916602044, "3": 0.0037891809174962518, "2": 6.012198357666155e-05, "1": 1.852062651897748e-05}, "score": 4.788106628500051}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9670357347226489, "4": 0.03229021615682747, "3": 0.0006494442245389069, "2": 9.729130777814653e-06, "1": 0}, "score": 4.966381207896504}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8707113306213101, "4": 0.12656933730371647, "3": 0.0026531172753437872, "2": 4.2730312285156555e-05, "1": 1.4855906911316098e-05}, "score": 4.867935674053437}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"4": 0.613546974322191, "3": 0.3433477833105259, "5": 0.025803986073898263, "2": 0.016579592622384107, "1": 0.0006831855952145685}, "score": 3.6472338869717285}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6534994549275491, "5": 0.3223415762102115, "3": 0.024047308533064346, "2": 9.038276151100276e-05, "1": 0}, "score": 4.298119845419308}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6724254894509346, "5": 0.31280233672200286, "3": 0.014709985942671625, "2": 3.650187240224198e-05, "1": 0}, "score": 4.298027002159677}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6652407724639633, "5": 0.313679379227286, "3": 0.0209654863592464, "2": 9.105279999359148e-05, "1": 0}, "score": 4.292538606094159}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6430179622916097, "5": 0.32088332353833837, "3": 0.03584780289025279, "2": 0.00018438418779560714, "1": 0}, "score": 4.2846856915836895}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5249557162227939, "4": 0.4519121845473423, "3": 0.023049640642686286, "2": 6.555297261271188e-05, "1": 1.0085830902665563e-05}, "score": 4.501748133955901}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7542391395894226, "5": 0.22350104261395465, "3": 0.022148940867498225, "2": 9.457881971976192e-05, "1": 1.3841205624111412e-05}, "score": 4.201121914627337}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5951909503285275, "4": 0.39429113154299505, "3": 0.01042175323596547, "2": 4.5274300696570136e-05, "1": 0}, "score": 4.5847084046479205}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.59748744974975, "5": 0.36993839026720454, "3": 0.032350267148542666, "2": 0.00018958255156289796, "1": 2.8271961617589448e-05}, "score": 4.337126177806872}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5095031977947478, "4": 0.4641185795642096, "3": 0.026287658723177048, "2": 7.9338186536673e-05, "1": 6.6946825227351555e-06}, "score": 4.483038967324066}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.46787500596893594, "3": 0.3011841521935225, "5": 0.18396414582637938, "2": 0.033198177471607915, "1": 0.013767658834190715}, "score": 3.7750782196028045}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6471138331520855, "4": 0.3440743882752926, "3": 0.008750950114440494, "2": 4.423138292051618e-05, "1": 0}, "score": 4.638285013936218}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6762063486743901, "3": 0.1768753556225148, "5": 0.14283860821037186, "2": 0.003644380087506784, "1": 0.00039318929318838005}, "score": 3.9574931342243436}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6874757794176247, "5": 0.23817147060354554, "3": 0.07287549805215106, "2": 0.0013069064800984268, "1": 0.0001665923079609521}, "score": 4.162182991362563}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7168076822171575, "5": 0.20895812624194615, "3": 0.07264169577800979, "2": 0.0015179080120004686, "1": 7.359047178889851e-05}, "score": 4.133059975722501}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7480879408028329, "3": 0.15296333910415252, "5": 0.09656885516975568, "2": 0.0022410815383934047, "1": 0.0001284394462633395}, "score": 3.9387374009534635}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8742235919628967, "4": 0.1248579484857125, "3": 0.0009143616375950146, "2": 6.599076077386406e-07, "1": 0}, "score": 4.873310912958408}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7430818639880024, "4": 0.24275178951364404, "3": 0.014067677345262958, "2": 7.413602325497556e-05, "1": 0}, "score": 4.728883796397041}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8309854610564645, "4": 0.1675833566269969, "3": 0.0014135245680175995, "2": 1.87602759124823e-06, "1": 0}, "score": 4.829581276653461}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5627041035288545, "4": 0.41607219005086504, "3": 0.021117058614285533, "2": 6.1034089843253834e-05, "1": 0}, "score": 4.541489676091267}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4695570854368911, "4": 0.4216217474287819, "3": 0.10374030188994778, "2": 0.003942677176489565, "1": 0.0010879660881651532}, "score": 4.35468534392962}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6913899412365455, "4": 0.2834786123801586, "3": 0.02494979682760324, "2": 0.0001440021972246744, "1": 3.326539135739025e-05}, "score": 4.666055262472675}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7256482033405467, "4": 0.2647806848471076, "3": 0.009499346236064748, "2": 3.739728312122468e-05, "1": 0}, "score": 4.7160986736273856}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5478378445106757, "5": 0.3975556717410612, "3": 0.05384252481308098, "2": 0.0007066182467951122, "1": 5.265991594923626e-05}, "score": 4.342143532182558}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5797117394128148, "5": 0.20897962913944154, "3": 0.20497669279300607, "2": 0.005517775439555579, "1": 0.0007909454942235392}, "score": 3.9905943306064464}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5029756397377483, "4": 0.4015383071738516, "5": 0.08387118240640523, "2": 0.011289023466499473, "1": 0.00032416205417729483}, "score": 3.5573442636268013}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8061514990956746, "4": 0.18824115477368678, "3": 0.005592804042289936, "2": 9.619425638564444e-06, "1": 0}, "score": 4.800543397007236}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9154216959351839, "4": 0.0815945996468931, "3": 0.002939711005241416, "2": 3.8712620228010655e-06, "1": 0}, "score": 4.912510854303871}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5096980435896958, "4": 0.4619640337300269, "3": 0.02819181193823341, "2": 0.00013654879973685975, "1": 9.11802804858878e-06}, "score": 4.481205993582045}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5698248762550703, "5": 0.37896451736906644, "3": 0.050837907095559284, "2": 0.000349208532456631, "1": 1.869063428388788e-05}, "score": 4.327373692736646}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8662610174516508, "4": 0.13009519854822746, "3": 0.0035865089031307078, "2": 2.4126614275589388e-05, "1": 0}, "score": 4.8626548510193865}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5126323281651184, "5": 0.46210646995633714, "3": 0.02478680806997173, "2": 0.0003917138340277564, "1": 7.66193425029846e-05}, "score": 4.436309020499231}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8130927762633302, "4": 0.17391703566482136, "3": 0.012848214843196567, "2": 0.00010583915732195231, "1": 2.3114741125563882e-05}, "score": 4.799973954007175}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9102897350334315, "4": 0.08791984780065665, "3": 0.0017665748855803353, "2": 1.1783975003852198e-05, "1": 0}, "score": 4.908510547295416}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8253695281676695, "4": 0.1675420356663365, "3": 0.0069496637630015205, "2": 9.657738054629654e-05, "1": 3.0304389134968636e-05}, "score": 4.818145524744601}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7388744235577341, "5": 0.21794062841638054, "3": 0.042805186663923994, "2": 0.0003479304341641459, "1": 2.7790870235517365e-05}, "score": 4.1743569126853854}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7661812871079999, "4": 0.23170422799447513, "3": 0.0021007349905224756, "2": 7.854837295231412e-06, "1": 0}, "score": 4.7640693466849475}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7533736191996909, "4": 0.24334959669702985, "3": 0.0032538284217066235, "2": 1.457284051997514e-05, "1": 0}, "score": 4.750096933040308}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9850838623426911, "4": 0.014847196788553653, "3": 6.836565358641792e-05, "2": 2.2451237697320743e-07, "1": 0}, "score": 4.985015393111999}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5616174583208885, "5": 0.41732044460560686, "3": 0.020875835188826034, "2": 0.00015943663299115634, "1": 1.8682655086728486e-05}, "score": 4.396072913247496}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4700404801538124, "4": 0.4377600280113904, "3": 0.08960516639545536, "2": 0.0020395256962438602, "1": 0.0005414203466188157}, "score": 4.374737015081114}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9126429210334014, "4": 0.08020713523898078, "3": 0.006951867155633671, "2": 0.00013315928696439104, "1": 6.22069393082918e-05}, "score": 4.9052405680008055}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.45601473335530657, "5": 0.453376533035328, "3": 0.089507693186893, "2": 0.0009302101775359897, "1": 0.00013411861003664348}, "score": 4.361619339300411}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4555809779167039, "5": 0.4471921101831656, "3": 0.0943449625207448, "2": 0.0023791968648312115, "1": 0.0004746945563648164}, "score": 4.346674397239407}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.680075783974785, "4": 0.28468445144816024, "3": 0.034355598142903475, "2": 0.0005846263691455446, "1": 0.0002373710569567036}, "score": 4.643878849232079}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6706360959828995, "2": 0.16573340095481612, "4": 0.15687850919119747, "5": 0.003666867586628186, "1": 0.003082610117885554}, "score": 2.9923136038336136}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.478068715761252, "3": 0.45407386315501913, "5": 0.05774420389914192, "2": 0.009402098217379631, "1": 0.0007091889959709565}, "score": 3.582737772017353}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5815666478031978, "4": 0.3338179147771382, "2": 0.05838069551755214, "5": 0.023857424745759068, "1": 0.002375909422623141}, "score": 3.318400698129261}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.626700439787824, "4": 0.24123420799347162, "2": 0.11702674272540335, "5": 0.01168638254571709, "1": 0.00335160481030404}, "score": 3.1408771083837954}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5815166352220585, "5": 0.23968672998610277, "3": 0.17541343598691245, "2": 0.003200747188584017, "1": 0.00017837544275713696}, "score": 4.057336907008936}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8258455982436496, "3": 0.12770318180564197, "5": 0.044122606889425126, "2": 0.002263545929344254, "1": 6.278452073399763e-05}, "score": 3.9117037781169466}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7520314004398462, "5": 0.17411961037177073, "3": 0.07319779363994076, "2": 0.0006018923194502137, "1": 0}, "score": 4.099722948756309}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7943767293867762, "3": 0.15157823267818632, "5": 0.05201962124176295, "2": 0.0019578996254558147, "1": 6.33036226875954e-05}, "score": 3.8963352416588304}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8529172557548734, "5": 0.09454264277189296, "3": 0.05235400710954716, "2": 0.00016899270663134374, "1": 0}, "score": 4.041851365976791}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.800003817060474, "5": 0.1338920768739856, "3": 0.06554443299444233, "2": 0.0004926332872286966, "1": 0}, "score": 4.067366893567071}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8412783405268821, "5": 0.11871706760034323, "3": 0.03992376573295521, "2": 5.1831162340311765e-05, "1": 0}, "score": 4.078691921213191}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7508641167553161, "5": 0.21457702803898676, "3": 0.034493564795842806, "2": 4.678209564162818e-05, "1": 0}, "score": 4.179993230423126}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5551064787686782, "4": 0.43758527845345585, "3": 0.007284743859058315, "2": 6.2116810386236765e-06, "1": 0}, "score": 4.5478187818210785}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6030491358015566, "4": 0.3879167594016365, "3": 0.00901478744978234, "2": 1.0177623724235845e-05, "1": 0}, "score": 4.594019422277481}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6344781937693946, "4": 0.3541075140336643, "3": 0.011350766548755302, "2": 1.2046817991438562e-05, "1": 0}, "score": 4.623135411866713}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4814969125086141, "5": 0.44061601372788645, "3": 0.07297661730752844, "2": 0.0027781640030985445, "1": 0.002094945584355545}, "score": 4.355811520107153}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9472653001845907, "4": 0.051597265607575556, "3": 0.0010480499835432094, "1": 8.672564680635185e-06, "2": 0}, "score": 4.946267607336028}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5159333956652491, "5": 0.3667570277158123, "3": 0.1008850327589281, "1": 0.008600559669425254, "2": 0.0075571473096101805}, "score": 4.225016063914052}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6631239652697677, "4": 0.3225342328524373, "3": 0.014212960775375783, "2": 6.048706605484614e-05, "1": 0}, "score": 4.6488343808111425}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7596389229346251, "4": 0.2306151442638045, "3": 0.009282073682322839, "2": 0.00022408726636275584, "1": 0.00019659613689734204}, "score": 4.7493512400852005}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9511452729560269, "4": 0.04811955190266309, "3": 0.0007308853137922669, "2": 1.976410969000665e-06, "1": 0}, "score": 4.950412633520612}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.985892874336036, "4": 0.014021388011910857, "3": 8.219015762445082e-05, "2": 2.7517570941223395e-07, "1": 0}, "score": 4.985813359722504}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8906775088123886, "4": 0.10900029394647262, "3": 0.00031403377944241986, "2": 2.854552678959502e-07, "1": 0}, "score": 4.890369918462352}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9889502479839102, "4": 0.010996895206274084, "3": 3.067882134199422e-05, "1": 0, "2": 0}, "score": 4.988941501895797}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.896003105547839, "4": 0.10226272928733611, "3": 0.0017226604670932493, "2": 7.790932503864153e-06, "1": 2.307223971599789e-06}, "score": 4.89425919935628}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.38817217025916695, "5": 0.289044477883627, "3": 0.20222943688097056, "2": 0.060679073089849093, "1": 0.05984666925932632}, "score": 3.7859108555913568}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.557642167047481, "5": 0.3920719931733182, "3": 0.04632776136780366, "2": 0.0025679648010617897, "1": 0.0013649315474376681}, "score": 4.336521981878792}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.36576285234501466, "3": 0.23556761363560164, "2": 0.16376470614176325, "5": 0.13808530950549938, "1": 0.09680591317952239}, "score": 3.2845608103598365}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8067222386370547, "4": 0.12623386764765876, "3": 0.04392617478583647, "1": 0.015334301988399539, "2": 0.007771729130833347}, "score": 4.701257895793552}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3996090319442829, "3": 0.2987116357147597, "2": 0.16159281427562033, "1": 0.08744955204005497, "5": 0.05258954201571492}, "score": 3.1683041792789908}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6374609236905049, "4": 0.34430967793996214, "3": 0.01801507809126844, "2": 0.0001737772936674911, "1": 2.989964352139728e-05}, "score": 4.619015180471034}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.793734798860904, "4": 0.19661008018990922, "3": 0.00957309231305564, "2": 4.780224275532902e-05, "1": 0}, "score": 4.784092938735702}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7417942836568118, "3": 0.14277523050060215, "5": 0.11207537981616514, "2": 0.003123722123201846, "1": 0.0002240980228096938}, "score": 3.9623801369069067}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.772580761533748, "4": 0.20695760778478473, "3": 0.02020985544983808, "2": 0.00016256689164549474, "1": 5.451514527208882e-05}, "score": 4.751908312966311}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7702692884610084, "4": 0.20144636735435933, "3": 0.02804357299513856, "2": 0.00017981787946854639, "1": 3.262632761399786e-05}, "score": 4.74178921337409}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6619011198412676, "5": 0.2566382174627658, "3": 0.07882003997871846, "2": 0.002121549205203013, "1": 0.0004996531501315384}, "score": 4.172079461468667}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6992160640533875, "5": 0.17331058587905937, "3": 0.1228290534057937, "2": 0.0038531202668687183, "1": 0.0007620091457904374}, "score": 4.040490445497067}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.669594710051577, "5": 0.27240683860796705, "3": 0.05627396973738612, "2": 0.0011219619332969606, "1": 0}, "score": 4.214017894995404}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.524915227949852, "5": 0.3621281225784538, "3": 0.10144552744305348, "2": 0.008088338063335972, "1": 0.003366465156834411}, "score": 4.234419725777863}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6108986739369466, "3": 0.18539119850158434, "5": 0.17312822050822138, "2": 0.023981878412165276, "1": 0.006594205302985121}, "score": 3.9199901833491375}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8240074399894644, "4": 0.17468800932533307, "3": 0.0012938880517198265, "2": 6.646919790502346e-06, "1": 0}, "score": 4.822703561840122}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9601604836720173, "4": 0.039655505027360864, "3": 0.0001808112298378596, "2": 1.0044524407544429e-06, "1": 0}, "score": 4.959979771286493}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9066895406684536, "4": 0.09267399262315963, "3": 0.0006165129067844668, "2": 2.93335423384258e-06, "1": 0}, "score": 4.9060825829841175}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9953627892170558, "4": 0.004628207661402284, "3": 7.488762457907522e-06, "1": 0, "2": 0}, "score": 4.995356807782223}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7971753993005789, "4": 0.20125788164437936, "3": 0.0015396383927982805, "2": 7.225139617001719e-06, "1": 0}, "score": 4.795637108419155}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"5": 0.622719626009769, "4": 0.3302712805358012, "3": 0.04646141945087171, "2": 0.0004804888667296437, "1": 3.5038433463057486e-05}, "score": 4.575210604649729}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9728695127111272, "4": 0.02649579335265386, "3": 0.00040829304247977876, "2": 1.2919084684066174e-06, "1": 0}, "score": 4.972677594317963}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7570623457145514, "4": 0.22960771802735042, "3": 0.013254999194641445, "2": 3.9566173867565406e-05, "1": 0}, "score": 4.743754521431233}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7513603841122469, "4": 0.2434095410845446, "3": 0.00519842283687836, "2": 1.5282991723013315e-05, "1": 0}, "score": 4.746143608897709}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8460070805216527, "4": 0.1480303142764223, "3": 0.005863600759620035, "2": 3.433439282150799e-05, "1": 0}, "score": 4.8401291421695865}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7634850006732905, "4": 0.2297396425856913, "3": 0.0067524944109412025, "2": 1.5512071976218073e-05, "1": 3.8134395768758594e-06}, "score": 4.756692718084489}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9842295092683445, "4": 0.015347771417759564, "3": 0.0003745196074633915, "2": 9.627211797894074e-07, "1": 0}, "score": 4.983899540666614}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9964348054518569, "4": 0.0035242909918940793, "3": 3.8741894431753835e-05, "2": 1.968785097940676e-07, "1": 0}, "score": 4.996397627505832}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9879598783661286, "4": 0.011941451646188378, "3": 8.918613211747363e-05, "1": 0, "2": 0}, "score": 4.987880061145827}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9559827213459317, "4": 0.0431727530134129, "3": 0.0008145872619957132, "2": 2.0711552801868e-06, "1": 0}, "score": 4.955190610283482}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7029412718447372, "5": 0.18023022816725542, "3": 0.11497373132181786, "2": 0.0017716261949210805, "1": 7.489892649903144e-05}, "score": 4.0614890545638715}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6852295276392503, "5": 0.2104190837495667, "3": 0.10333152193355248, "2": 0.0009304055421858426, "1": 6.059089037703897e-05}, "score": 4.105048010822329}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.759881696741965, "5": 0.20635159360253827, "3": 0.03333355272279381, "2": 0.00013629887134005455, "1": 0}, "score": 4.172796739242085}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6063086919211724, "4": 0.3602291580158493, "3": 0.03321700285396703, "2": 0.0002146407194416254, "1": 1.943760434126253e-05}, "score": 4.572610432974463}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6282576663041113, "5": 0.3298847592186927, "3": 0.04163376842553596, "2": 0.0001468427898889484, "1": 0}, "score": 4.28797946905264}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.750118218654957, "5": 0.20514993026828407, "3": 0.043953395481856325, "2": 0.0006885603426434161, "1": 8.481747188578704e-05}, "score": 4.159565771925428}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8223608088707369, "5": 0.15642192113230988, "3": 0.02114664531538832, "2": 6.58048509306538e-05, "1": 3.6427852148255133e-06}, "score": 4.135132896816972}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5981617121101219, "4": 0.39259840885030056, "3": 0.009187005858485696, "2": 3.518692476171686e-05, "1": 0}, "score": 4.588914748099306}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7402652952038372, "5": 0.24397859083940135, "3": 0.015712888183140962, "2": 3.8495892910898496e-05, "1": 2.4222153564562654e-06}, "score": 4.228181970791998}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8281825482463625, "4": 0.17024792874301528, "3": 0.0015412668050889828, "2": 5.049607704356886e-06, "1": 0}, "score": 4.826650365968452}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6938173760545591, "5": 0.2899220457197087, "3": 0.016195351862203812, "2": 5.027734399105262e-05, "1": 0}, "score": 4.273630229673172}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7319606231343926, "4": 0.2657871442833559, "3": 0.002241088933974685, "2": 4.229685151270791e-06, "1": 0}, "score": 4.729716120060462}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5208460866351436, "4": 0.4705523977770816, "3": 0.008563508511197089, "2": 2.8056197658762456e-05, "1": 0}, "score": 4.5122315628828895}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9376763764056651, "4": 0.06207597133161878, "3": 0.0002409268975874445, "2": 6.343893209972728e-07, "1": 0}, "score": 4.93743989065313}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6862994846352517, "4": 0.31138997917914724, "3": 0.0022890914199343512, "2": 8.382737719385699e-06, "1": 0}, "score": 4.684002562200463}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7528391923233974, "4": 0.19470696388233197, "3": 0.04810445916665063, "2": 0.0024250006173873536, "1": 0.001864714165684118}, "score": 4.694332020108625}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8134297673317031, "4": 0.17220037659983264, "3": 0.013797939631925786, "2": 0.00036683478073795103, "1": 0.00020404397982055704}, "score": 4.798286854561934}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6662456184226704, "4": 0.3121332184787415, "3": 0.02148155970527874, "2": 0.00010940379274236047, "1": 2.5281465996477622e-05}, "score": 4.644472576336775}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8511718090588563, "4": 0.14005099117601394, "3": 0.008370304627347249, "1": 0.000226446011789127, "2": 0.00017810558666940795}, "score": 4.841767927939043}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7945138029726628, "4": 0.19303261784087763, "3": 0.01205150175306952, "2": 0.0002493886587226294, "1": 0.0001516770452201036}, "score": 4.7815092834424435}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5541555474906845, "3": 0.35166808098143876, "4": 0.06664934898980142, "1": 0.025619469223495315, "5": 0.0019061939906391508}, "score": 2.4650665238855236}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5360808713007643, "5": 0.32361630784387185, "3": 0.11766478527606888, "2": 0.01993672640884753, "1": 0.0026876743855149435}, "score": 4.158017201124116}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5653673398901202, "4": 0.42092658623286916, "3": 0.013512555347540506, "2": 0.00017559119858020779, "1": 1.2856783333889462e-05}, "score": 4.551467828039266}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.525736916558242, "5": 0.45624746055854726, "3": 0.017851299005267548, "2": 0.00015184322255010348, "1": 8.640570044085567e-06}, "score": 4.438068235617461}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6454474382330221, "3": 0.31667413472235184, "5": 0.01890196866824604, "2": 0.01837409843222287, "1": 0.0005952101627966592}, "score": 3.6636916020615446}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.711547054084122, "4": 0.23922470032705168, "3": 0.04201902865864019, "2": 0.004930100035287667, "1": 0.002276108710542422}, "score": 4.6528414630907555}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.773849940122096, "4": 0.21284099380633484, "3": 0.012760953221198568, "2": 0.00039697351196268894, "1": 0.00013050709041441288}, "score": 4.759919197447066}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8729340413552783, "4": 0.11812120744138103, "3": 0.008476975970755753, "2": 0.00032627858053235433, "1": 0.00013642889429246906}, "score": 4.863399597040589}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9284520425323918, "4": 0.06923976103060903, "3": 0.002148882154911734, "2": 8.447778141590643e-05, "1": 4.609749259522508e-05}, "score": 4.926022525305696}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9939241944127437, "4": 0.005997917220105848, "3": 7.001136303621992e-05, "2": 1.460366684515674e-06, "1": 0}, "score": 4.993857639540467}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9458625608488821, "4": 0.04102292180843437, "3": 0.006639172146490121, "1": 0.005241749302527162, "2": 0.0012242828928340967}, "score": 4.921058152824486}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9982143174316426, "4": 0.0015321300840633347, "3": 7.325302602491704e-05, "1": 5.260670367754736e-05, "2": 0}, "score": 4.998110695798719}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9923222103655447, "4": 0.0068360828099515965, "3": 0.0006868020802797977, "1": 0.00010608679268182515, "2": 4.004567020628199e-05}, "score": 4.991245752053415}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8895586696867059, "4": 0.09754020763364148, "3": 0.010572993626933192, "1": 0.0014723444274595914, "2": 0.0008337257888638785}, "score": 4.872920446808988}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9433798634664126, "4": 0.054153265643194885, "3": 0.002270094087749472, "1": 7.37961496856525e-05, "2": 7.350398026106103e-05}, "score": 4.9407879200250795}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7929237625412947, "3": 0.14591437527999013, "5": 0.054413679246122046, "2": 0.006409538548208277, "1": 0.000314628965718572}, "score": 3.894733811960982}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5860098972749822, "5": 0.3999229401733866, "3": 0.007920256399544162, "2": 1.3058934792997677e-05, "1": 0}, "score": 4.394395729049399}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6550610379360252, "5": 0.33632299033314095, "3": 0.008569122017388903, "2": 5.908467892514426e-06, "1": 0}, "score": 4.3277554700971494}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6867987499968528, "5": 0.3027235094892126, "3": 0.010441904393420702, "2": 2.5650422878299103e-05, "1": 0}, "score": 4.2922332808498735}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8260873173257951, "5": 0.09856387143368206, "3": 0.07465265422770664, "2": 0.0006492872079094892, "1": 2.5540196846729925e-05}, "score": 4.022536502894389}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7976097310461648, "3": 0.10911053805712044, "5": 0.09068764948375115, "2": 0.0025316156075219152, "1": 5.1991776298258014e-05}, "score": 3.9763577045371914}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.849206606082453, "3": 0.10291164236759938, "5": 0.04686703167851465, "2": 0.0009734442523197537, "1": 3.0261084828464223e-05}, "score": 3.941917077795452}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8314402009607109, "3": 0.135837127886334, "5": 0.030630280515034684, "2": 0.002029105953369253, "1": 5.174012320376534e-05}, "score": 3.890578457128637}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5759911978001341, "5": 0.3979164978924599, "3": 0.025816176174986744, "2": 0.00025568495906047687, "1": 1.1070274663875444e-05}, "score": 4.371559223562322}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.868482085896654, "3": 0.07722637771999616, "5": 0.053694935118864945, "2": 0.0005360216531722588, "1": 0}, "score": 3.9753950235326134}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5773944060334546, "4": 0.39427635773108527, "3": 0.02774301450578913, "2": 0.0004267148356654954, "1": 0.00014384891652109258}, "score": 4.548375001550198}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5189293355997223, "5": 0.44792391212416044, "3": 0.032853532683530834, "2": 0.00021860524257655736, "1": 5.2912179992370764e-05}, "score": 4.4144834276053135}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5798842873003163, "5": 0.35469528862303856, "3": 0.06313603467063457, "2": 0.0017204054314054675, "1": 0.0005560455180879271}, "score": 4.286452580526683}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6548421269211523, "5": 0.31684220660376244, "3": 0.028176217723225403, "2": 0.00011525309751071061, "1": 1.726871629617635e-05}, "score": 4.288385674166327}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.682263337704216, "5": 0.2128367370290266, "3": 0.10224765687190343, "2": 0.00236862774991481, "1": 0.000281052239560398}, "score": 4.105008939744317}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7762683008795932, "5": 0.17596874235015383, "3": 0.04748816295237038, "2": 0.00025937750738487845, "1": 1.1754422561236869e-05}, "score": 4.127927029569776}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5026053044043824, "5": 0.48530183083214357, "3": 0.01206620149137674, "2": 2.156411429758623e-05, "1": 0}, "score": 4.473194914007709}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6948592026887673, "4": 0.30071238578366466, "3": 0.0043901319298016595, "2": 3.0315058157581947e-05, "1": 0}, "score": 4.690413939471818}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.50411050953269, "4": 0.48796735541886943, "3": 0.00788079099558278, "2": 3.482169311575813e-05, "1": 0}, "score": 4.496163311306482}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6665500556052371, "4": 0.32759453797179006, "3": 0.005812460522033163, "2": 1.528173856907206e-05, "1": 0}, "score": 4.660725310018325}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9838313961374029, "4": 0.015499332817742023, "3": 0.0006497525239215299, "2": 3.5316477896484243e-06, "1": 0}, "score": 4.9831902984564795}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.995936526740952, "4": 0.003997505649495512, "3": 4.3261390287966826e-05, "1": 0, "2": 0}, "score": 4.995915878834977}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9801772836446898, "4": 0.019187769656011034, "3": 0.0005879492049127244, "2": 2.278830922022178e-06, "1": 0}, "score": 4.979628584458921}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988257038260017, "4": 0.0011353338844353367, "3": 2.2984671976649975e-05, "1": 0, "2": 0}, "score": 4.998818677896898}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9972109047734261, "4": 0.0027305506140330236, "3": 5.506435311930744e-05, "2": 3.079913927439033e-07, "1": 0}, "score": 4.9971583876911945}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7904245601238886, "3": 0.13453724550799182, "5": 0.07349344944002693, "2": 0.0014708132498161312, "1": 0}, "score": 3.936009846532964}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7833931043480168, "3": 0.19061486504708228, "5": 0.023743487419993544, "2": 0.0022259711203500144, "1": 2.1187588411884588e-05}, "score": 3.8286128800855965}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8923962130405982, "3": 0.09542506492250134, "5": 0.011872213609559725, "2": 0.000275882088254302, "1": 0}, "score": 3.9158928086151867}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.748962644904765, "5": 0.19930961680845535, "3": 0.05129112724251442, "2": 0.0004066793178181807, "1": 1.5105222696554397e-05}, "score": 4.147161997160118}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6384426419773036, "3": 0.33091405165400045, "5": 0.025022371356432795, "2": 0.0055119710360086345, "1": 0.00010494921410560898}, "score": 3.6827682563781012}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"5": 0.839170521016295, "4": 0.1535125893513065, "3": 0.007221771471564046, "2": 5.128608962319345e-05, "1": 0}, "score": 4.831882640504622}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7873999531280478, "4": 0.20711056456069188, "3": 0.005455778264159841, "2": 1.4879249003914882e-05, "1": 0}, "score": 4.781929136023992}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8679730961682645, "4": 0.13000469679329568, "3": 0.002006649225457028, "2": 4.312210104548438e-06, "1": 0}, "score": 4.865967560849893}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.588440242202028, "4": 0.4028919206406191, "3": 0.008634227783887649, "2": 2.2806818721111446e-05, "1": 0}, "score": 4.579766663741822}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8558381738098692, "4": 0.14170847848849683, "3": 0.002422574648548044, "2": 6.461493984224598e-06, "1": 0}, "score": 4.85342342422737}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"2": 0.34675000686121027, "3": 0.3196727061115072, "1": 0.19506344780145918, "4": 0.12117403027073352, "5": 0.017327663644665404}, "score": 2.418945398007421}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5354690967017529, "2": 0.31471280065506685, "3": 0.11694064273144192, "4": 0.026078952698398647, "5": 0.006783278766802617}, "score": 1.653974018288731}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.42608409759549176, "2": 0.36638385903668225, "3": 0.14897112258116663, "4": 0.04911122771284632, "5": 0.00943366410010875}, "score": 1.8494080588774295}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.5697931948727011, "2": 0.25463292008997873, "3": 0.10377100318730992, "4": 0.04898112789788475, "5": 0.022817910572051268}, "score": 1.700392644321591}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8385931773840087, "2": 0.12994026943473536, "3": 0.02507770185479175, "4": 0.0038621085043208, "5": 0.0025215726617192776}, "score": 1.201769332483976}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.599975390764287, "5": 0.38704384414697757, "3": 0.012875281095634836, "2": 3.8646629207274535e-05, "1": 0}, "score": 4.374116274738522}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5715491486828244, "4": 0.3998924512106818, "3": 0.028289832910379866, "2": 0.00015383514745276122, "1": 0}, "score": 4.543013946580081}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8030236527417509, "5": 0.16875108831098715, "3": 0.028135481846862195, "2": 8.10463779388148e-05, "1": 0}, "score": 4.1404547399795995}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5835660134874916, "5": 0.3601986118784241, "3": 0.05564898724936688, "2": 0.0005378197990032895, "1": 3.21863534868738e-05}, "score": 4.303382395748067}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5459846211641157, "5": 0.3964043233706034, "3": 0.0569751540520842, "2": 0.0005451628503247002, "1": 0}, "score": 4.338369546784265}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4941657459255004, "4": 0.39695217561389434, "2": 0.08542258088203694, "5": 0.014580945578676884, "1": 0.008872411039824528}, "score": 3.3229486470243073}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5021289599253532, "5": 0.4822373493963461, "3": 0.015544251300433748, "2": 8.013106110245194e-05, "1": 0}, "score": 4.466537178649549}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6811994756080848, "3": 0.15909929099444858, "5": 0.15414491693360247, "2": 0.005355201218346759, "1": 0.000193043115043566}, "score": 3.9837559630333446}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6322555596718658, "5": 0.3232227709968611, "3": 0.043875811571985085, "2": 0.0005640306296786328, "1": 5.917845607265882e-05}, "score": 4.278047660207984}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6282995222240456, "3": 0.31619046804385414, "5": 0.03226615922465514, "2": 0.020991984596505517, "1": 0.002248886666760833}, "score": 3.6673440709242673}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7316668291998315, "3": 0.2008064038479568, "5": 0.059744687754352634, "2": 0.007203530686707008, "1": 0.0005597244214006519}, "score": 3.8428490910459656}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7510850760092156, "3": 0.23354231447100365, "5": 0.011965449385383712, "2": 0.003291248180445298, "1": 0}, "score": 3.771814189090283}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7087834494943998, "5": 0.2654751074356909, "3": 0.025336247527488684, "2": 0.00031486203475084604, "1": 0}, "score": 4.239530773493666}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7128631303775042, "5": 0.2385889457554288, "3": 0.04822238242722068, "2": 0.000258441808898783, "1": 0}, "score": 4.189862419408684}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7069127708330735, "3": 0.27901394955657144, "5": 0.00914592366548197, "2": 0.004842156982442388, "1": 6.530362566647801e-05}, "score": 3.720246183470635}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"5": 0.574989125809078, "4": 0.386273967853587, "3": 0.03771300438908948, "2": 0.0007240913496413449, "1": 0.00024987744007719844}, "score": 4.535105025884561}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9890488967351729, "4": 0.010559007414086389, "3": 0.0003514577686569827, "2": 2.8523538279823464e-06, "1": 0}, "score": 4.988729094107729}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7321045480605832, "4": 0.2568184150605518, "3": 0.010950716402214157, "2": 5.3101467158208315e-05, "1": 0}, "score": 4.721100426983061}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8746805543723729, "4": 0.12295737849022662, "3": 0.0022680231181063416, "2": 1.2708836742052307e-05, "1": 0}, "score": 4.872458075117591}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8603252272520362, "4": 0.13846636982328508, "3": 0.0011804715519911726, "2": 4.18721383943291e-06, "1": 0}, "score": 4.859156781227455}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.33564326310131914, "1": 0.22584194111147615, "4": 0.20280746465073995, "3": 0.14998703829293397, "2": 0.08569476846421455}, "score": 3.3367239348356494}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5887232911681719, "5": 0.2465057152918559, "3": 0.14048204387178023, "2": 0.016332292435649258, "1": 0.007938647168823323}, "score": 4.049544037333576}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.25639855235318026, "3": 0.2375735545707185, "1": 0.22349833826770035, "2": 0.1486776707309185, "5": 0.13381175234243972}, "score": 2.9283448341256095}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.48974805185550396, "5": 0.40323091139396416, "3": 0.09133023364787879, "2": 0.008920499822923762, "1": 0.006759360459402597}, "score": 4.273784592697636}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6201940041312352, "5": 0.22235677333451895, "3": 0.13022854937643813, "2": 0.019322624804106868, "1": 0.00785424130078461}, "score": 4.029921561222929}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5192207235506727, "5": 0.4180307853527873, "3": 0.06001137208316832, "2": 0.0018126534731115293, "1": 0.0008812440109024085}, "score": 4.351765578136952}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6742585744663497, "4": 0.319007871804059, "3": 0.006687938492082675, "2": 2.761664188789458e-05, "1": 0}, "score": 4.66752741724654}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7498922420807567, "4": 0.23598474874655972, "3": 0.013985844052780097, "2": 7.764961240086505e-05, "1": 0}, "score": 4.735794890009471}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6207085319293003, "4": 0.37360027744571817, "3": 0.005562590288394649, "2": 1.2009278483361203e-05, "1": 0}, "score": 4.615193649162434}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7615543019476518, "4": 0.22338871687527248, "3": 0.014883500925488083, "2": 9.662355556914887e-05, "1": 0}, "score": 4.746534930119218}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6112129949406929, "4": 0.37797207566253443, "3": 0.010671442827385422, "2": 0.00010824006214079031, "1": 2.8332953389906087e-05}, "score": 4.600244222949619}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5056299001212622, "5": 0.47784684776294206, "3": 0.01644340983455092, "2": 5.742005071746367e-05, "1": 0}, "score": 4.461298941178157}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9478030182252354, "4": 0.05077151043112687, "3": 0.0014113804655088787, "2": 3.1129491542446965e-06, "1": 0}, "score": 4.946395801327307}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7592035923048281, "4": 0.23144423962948305, "3": 0.00929382293536674, "2": 4.78221326251213e-05, "1": 5.5928475487818895e-06}, "score": 4.749801043193289}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.512642478385703, "5": 0.45695487260443, "3": 0.03013575917190276, "2": 0.000227179069282022, "1": 1.947104631826941e-05}, "score": 4.426314970651654}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5688170247192565, "5": 0.37564970705583556, "3": 0.05438235686819014, "2": 0.000996385825888591, "1": 8.888661404089318e-05}, "score": 4.3190288594025015}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9749487670307898, "4": 0.024700815986578806, "3": 0.00034543585170426804, "2": 1.516964893382209e-06, "1": 0}, "score": 4.974603673438241}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7387612071159335, "4": 0.24827377754475582, "3": 0.012901657338682081, "2": 4.6576473725088944e-05, "1": 0}, "score": 4.725778576502508}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8716078060075685, "4": 0.1250054428284736, "3": 0.0033580494312211756, "2": 2.2908054141579415e-05, "1": 0}, "score": 4.868208970591793}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5832885063165512, "4": 0.40461515427273403, "3": 0.01202911882269042, "2": 5.598145963466167e-05, "1": 9.205918182675859e-06}, "score": 4.571120968029025}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8065212930237903, "4": 0.19068487167795836, "3": 0.002744634126921912, "2": 2.05257388233941e-06, "1": 0}, "score": 4.803810452284542}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.794895292936537, "4": 0.2011673963221535, "3": 0.0038526386569366087, "2": 4.228336096893152e-06, "1": 0}, "score": 4.791097836482626}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5781912688989398, "4": 0.41504405822038853, "3": 0.006160444776906699, "2": 3.720754826177328e-06, "1": 0}, "score": 4.5723670932581735}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7650265499047415, "4": 0.23200018729734748, "3": 0.002938532417450959, "2": 2.3712863176250687e-06, "1": 0}, "score": 4.762107936037103}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.950914853589304, "4": 0.0487630707269232, "3": 0.00024466221818214616, "2": 1.7238163670883742e-07, "1": 0}, "score": 4.950743283049592}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5897605098481407, "5": 0.3440397073249037, "3": 0.06463845930904881, "2": 0.0012727084647129244, "1": 0.00021719673548778917}, "score": 4.276223968331093}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5200147512606917, "4": 0.4363289096951287, "3": 0.04265220101193692, "2": 0.0007477267157671727, "1": 0.00017276642849704867}, "score": 4.47538856135469}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8607148621164119, "4": 0.13538356594285192, "3": 0.0032802137205649342, "2": 1.3076380113106558e-05, "1": 0}, "score": 4.857930359093092}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5918725822203004, "5": 0.3673072454887507, "3": 0.040476897488937534, "2": 0.0002664806299804765, "1": 0}, "score": 4.326322446401939}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5502621763834277, "4": 0.428690142318974, "3": 0.020770380948018287, "2": 0.00015952945211930342, "1": 0}, "score": 4.529235065019747}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6452723262836445, "3": 0.2743450934250329, "5": 0.07188210734165046, "2": 0.007667265853275172, "1": 0.0008153419191526597}, "score": 3.7797525216923717}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7369233757297985, "5": 0.17784530136958543, "3": 0.08480961145307934, "2": 0.00039014971807829855, "1": 3.0392125886324148e-05}, "score": 4.0921643218984105}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5261722017861131, "3": 0.4460866336381064, "5": 0.013810893695572441, "2": 0.013581068202054703, "1": 0.0003453877013027014}, "score": 3.539524203844946}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5419093567483947, "4": 0.41030487420175044, "3": 0.04744010077655116, "2": 0.0003090127561128482, "1": 2.7738727958138513e-05}, "score": 4.493772417140316}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.65077666509748, "3": 0.2971504508272492, "5": 0.045669038738147885, "2": 0.006086783486036797, "1": 0.0003121236920005844}, "score": 3.7354073432621915}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.838833410031083, "4": 0.16068642242617248, "3": 0.0004615713091144915, "2": 9.25857038766742e-07, "1": 0}, "score": 4.838384801583063}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8916164300840114, "4": 0.10782630862047142, "3": 0.000411047203375812, "2": 4.7201928223617423e-07, "1": 0}, "score": 4.891334343756941}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9180485711608906, "4": 0.0818072179719826, "3": 0.00014245291983047372, "2": 2.3565946945009953e-07, "1": 0}, "score": 4.91790704424084}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9340483831567081, "4": 0.065844195630538, "3": 9.477034633590817e-05, "2": 1.1170794560090481e-07, "1": 0}, "score": 4.933965100530884}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8942489365969939, "4": 0.10517987492222075, "3": 0.000491144095353277, "2": 6.020255203067498e-07, "1": 0}, "score": 4.893827596224197}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7650186625216716, "5": 0.12329534783226614, "3": 0.11121017495030332, "2": 0.0003955051695180065, "1": 4.577836309394171e-05}, "score": 4.011157212725179}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.898682119928284, "4": 0.09980454057062631, "3": 0.0014844009333581073, "2": 3.2123043895798227e-06, "1": 0}, "score": 4.897214376359467}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8796016187307161, "4": 0.11704724760690403, "3": 0.0031832725741315704, "2": 9.580373301375791e-06, "1": 0}, "score": 4.8765379244593445}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8437750654809223, "4": 0.1546012588864603, "3": 0.0015849934565833428, "2": 3.82713146552776e-06, "1": 0}, "score": 4.842211773090295}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7034908562673056, "4": 0.293232872192498, "3": 0.0031947852749484745, "2": 2.15188791742941e-06, "1": 0}, "score": 4.700347328835771}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4880629087814293, "3": 0.36555201427480954, "5": 0.11287656527613096, "2": 0.028717568518449085, "1": 0.004779181411349356}, "score": 3.6755480536116427}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5162741118679988, "4": 0.46760839320738923, "3": 0.01586665407508924, "2": 0.00020867928627598843, "1": 3.987472075074101e-05}, "score": 4.4998716181857645}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5262880460851285, "5": 0.35046171785464547, "3": 0.11298976947362857, "2": 0.007867428634433465, "1": 0.0023843970400517956}, "score": 4.214585754208637}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6377297338771385, "5": 0.3059499048720789, "3": 0.05424037075065094, "2": 0.0018465726125874002, "1": 0.0002286020131984394}, "score": 4.247331773975403}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.39001629058501885, "5": 0.30168145592085754, "3": 0.2672841377759705, "2": 0.03189125642569998, "1": 0.009118818807549266}, "score": 3.9432578926367814}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.872321212450644, "2": 0.09922278535377342, "3": 0.022106683397511363, "4": 0.004279042540093027, "5": 0.0020610714706883223}, "score": 1.1645190800149652}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6035725682639466, "2": 0.24807164088427558, "3": 0.09677045966723193, "4": 0.03250505380640658, "5": 0.019056325219506485}, "score": 1.6153677619022357}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3728598004881937, "5": 0.242629158019859, "3": 0.24018877555683307, "2": 0.097216969443644, "1": 0.0469791402621861}, "score": 3.6670270161730865}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.7210909683219108, "2": 0.12223611937725269, "3": 0.06514113860074283, "5": 0.0633374181794105, "4": 0.028182465083188904}, "score": 1.5904224849275994}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.4305377802344085, "5": 0.16924990982188964, "3": 0.16496322643692923, "2": 0.1343322594371379, "4": 0.10085806979343252}, "score": 2.443917397300427}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6244881030239298, "4": 0.3547816674420127, "3": 0.02057025867590273, "2": 0.00012309341737566805, "1": 3.095574357877148e-05}, "score": 4.603582364514537}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5503058854439802, "4": 0.42927078444673317, "3": 0.02031276444796883, "2": 7.181960995858542e-05, "1": 0}, "score": 4.529870012146798}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7012252758652058, "4": 0.2927460410234065, "3": 0.005976536855074883, "2": 1.9405209442078035e-05, "1": 0}, "score": 4.695232691237376}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8633716514695825, "4": 0.13360123151438943, "3": 0.002987795364001825, "2": 6.740273872254084e-06, "1": 0}, "score": 4.860398408523748}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7922685471152964, "4": 0.20328596431664403, "3": 0.004411316976406012, "2": 8.048224901338626e-06, "1": 0}, "score": 4.787861715289626}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8754455694548955, "4": 0.12152914116260817, "3": 0.0029796304387424265, "2": 2.578568667558918e-05, "1": 0}, "score": 4.872431705702374}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9253131391008198, "4": 0.07364414034992459, "3": 0.0010186024889661666, "2": 4.41635439375722e-06, "1": 0}, "score": 4.924303914266944}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7873083208536883, "4": 0.20543021275938367, "3": 0.007144820431260692, "2": 9.200823261252693e-05, "1": 0}, "score": 4.7799987013491885}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8673620066137548, "4": 0.12930157659093108, "3": 0.0030331202616703653, "2": 1.3126059879803242e-05, "1": 0}, "score": 4.864553502131633}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8078194244734498, "4": 0.18896191351938035, "3": 0.0029909506469161496, "2": 1.0201212216302344e-05, "1": 0}, "score": 4.804983163409142}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.594827197492612, "5": 0.2014078343500838, "3": 0.1970013101024535, "2": 0.005911574914910816, "1": 0.0008480832964928851}, "score": 3.990039084686228}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6812215604530774, "4": 0.30231329459889733, "3": 0.01639596518050837, "2": 5.669395311043764e-05, "1": 8.905468782426221e-06}, "score": 4.664687870772311}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8441015176868022, "4": 0.14733561489202107, "3": 0.008509317835079995, "2": 3.0244052632718747e-05, "1": 0}, "score": 4.8355511847125525}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6407097709655243, "4": 0.34431966306540607, "3": 0.014820306171234985, "2": 0.00011396547571975571, "1": 0}, "score": 4.625684242628293}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6071455930069781, "5": 0.23122840285741986, "3": 0.1573775946028369, "2": 0.003883661052490516, "1": 0.00034595640083284415}, "score": 4.065046839312475}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5777172886214936, "4": 0.3996315145808507, "3": 0.022398477302470587, "2": 0.00019951941661086695, "1": 4.733985579682484e-05}, "score": 4.554781004058687}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5253329116129352, "4": 0.43699575407904795, "3": 0.037145806292175274, "2": 0.0003425384992533557, "1": 0.00012201165317069137}, "score": 4.487165699686238}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7418246607546943, "4": 0.2493546496703089, "3": 0.008775737215471235, "2": 2.8637170962303485e-05, "1": 8.634791435886037e-06}, "score": 4.7329713743342285}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8750773644664047, "4": 0.12062975504955514, "3": 0.00424940375002379, "2": 1.585947411899378e-05, "1": 0}, "score": 4.870820291438456}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5949430751679514, "4": 0.35701606436271477, "3": 0.04693923904113978, "2": 0.0008418497532205191, "1": 0.00025589022859350696}, "score": 4.545554583475454}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5162234317261122, "5": 0.3947919151405091, "3": 0.08623669464122645, "2": 0.002440399557522763, "1": 0}, "score": 4.303767847899912}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7397457299547439, "4": 0.2367329420468975, "3": 0.022682113877285526, "2": 0.0007463317884500309, "1": 8.9199421841219e-05}, "score": 4.715305988643172}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.705762147366645, "5": 0.20081979808178615, "3": 0.09234870455439768, "2": 0.000912744648953574, "1": 0}, "score": 4.106662308117386}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8126375961569022, "4": 0.1837506138894143, "3": 0.0035811596730653994, "2": 1.4922133163253077e-05, "1": 0}, "score": 4.809039300726143}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5725915177485837, "4": 0.38962836672311824, "3": 0.03690220402664601, "2": 0.0006390865287499459, "1": 0.00015912889878318365}, "score": 4.533976309783651}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6919196104379963, "4": 0.2990395619889222, "3": 0.008930897368041858, "2": 9.018107179308414e-05, "1": 1.3973135005905311e-05}, "score": 4.682770375201837}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8368568086581184, "4": 0.1554503330484646, "3": 0.007581531916084228, "2": 6.88530523802244e-05, "1": 2.2488398588941023e-05}, "score": 4.829086674677649}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9719628795639186, "4": 0.026770573458355318, "3": 0.0012497954263268904, "2": 1.0629057858192436e-05, "1": 3.501563412216904e-06}, "score": 4.970683865426228}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.957049684451114, "4": 0.041299478756615, "3": 0.0016271683230689232, "2": 1.215413642031361e-05, "1": 0}, "score": 4.9554092087547765}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9611243999023713, "4": 0.03731349580291921, "3": 0.0015181967455620432, "2": 1.1147291548657165e-05, "1": 0}, "score": 4.959615345819637}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5331363880641115, "5": 0.45121388760750836, "3": 0.01563611931957541, "2": 6.864104304616889e-06, "1": 0}, "score": 4.435566976194713}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8368254354844556, "3": 0.08728132993540741, "5": 0.07566431726591698, "2": 0.00021818832324459544, "1": 7.394922070432794e-06}, "score": 3.987924385656879}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4943574205650808, "5": 0.47671009030669514, "3": 0.028871812668725443, "2": 2.9389649600796862e-05, "1": 0}, "score": 4.447793508369138}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6265357520208064, "4": 0.36806152768224054, "3": 0.005397013683277719, "2": 1.9758971689456283e-06, "1": 0}, "score": 4.6211371038296365}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7505012217464141, "4": 0.23812774633555336, "3": 0.011337872596517133, "2": 1.8497369965745755e-05, "1": 0}, "score": 4.739137191603658}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8921690914155264, "3": 0.07150723826003128, "5": 0.035950337745188694, "2": 0.00036031302155304414, "1": 0}, "score": 3.9637220011185517}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6055844828245489, "4": 0.39061904633110245, "3": 0.0037734616095094786, "2": 4.871318101980715e-06, "1": 0}, "score": 4.601812194198304}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6458930992049066, "3": 0.3163287683726927, "5": 0.029352305025489488, "2": 0.008231645047520351, "1": 0.00018641000169318436}, "score": 3.695998653748513}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8833577919970936, "5": 0.06370818065018963, "3": 0.0527325904480664, "2": 0.00012585350325755292, "1": 0}, "score": 4.010724693804445}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7552547873299451, "5": 0.23034145131734066, "3": 0.014346805138445166, "2": 1.8948344343290507e-05, "1": 0}, "score": 4.215964957858236}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9524348150177612, "4": 0.04634345060384056, "3": 0.0011655086241357101, "2": 5.890462738347783e-06, "1": 0}, "score": 4.9513054097032745}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8537783006569848, "4": 0.1247015869792276, "3": 0.019698468251345105, "1": 0.0012331821951280842, "2": 0.0005623832505533231}, "score": 4.829277145761486}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5784784410652807, "4": 0.4103998584635613, "3": 0.011067437948663373, "2": 1.6901317170322524e-05, "1": 0}, "score": 4.567398399170368}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8889410554474847, "4": 0.1091194636641859, "3": 0.0019186067641905312, "2": 8.52129698859781e-06, "1": 0}, "score": 4.887016363249131}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5486947242294352, "5": 0.4244385891539155, "3": 0.02668711805105426, "2": 0.00013441628084125845, "1": 0}, "score": 4.397500586600855}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5111377273229295, "3": 0.4188511972351452, "5": 0.034220852448546446, "2": 0.03271024327930032, "1": 0.00301928026151709}, "score": 3.5408634585335315}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6187689124441818, "3": 0.193003452815795, "5": 0.17349690818731997, "2": 0.013020560421527121, "1": 0.0016837766543770678}, "score": 3.949399669249085}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7692078960842982, "3": 0.11757145530251632, "5": 0.11041910583639968, "2": 0.0026071359430325015, "1": 0.00016726770584752517}, "score": 3.9871312262829797}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5814948054973188, "4": 0.40345708250088624, "3": 0.0149061812956649, "2": 0.0001165748502326836, "1": 1.4549062491450361e-05}, "score": 4.566317947394773}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5720485234465728, "5": 0.3158067509794742, "3": 0.10950604782195943, "2": 0.002377647798421383, "1": 0.0002528530671999227}, "score": 4.200788490183742}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7050292836079175, "4": 0.2888251474778532, "3": 0.006089026879071185, "2": 2.7980380215163065e-05, "1": 0}, "score": 4.698904257830667}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9618208714197367, "4": 0.03781876012005842, "3": 0.000351198488509856, "2": 9.502535435620775e-07, "1": 0}, "score": 4.961475675483202}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9370394267383294, "4": 0.06236955645383602, "3": 0.0005836640485461312, "2": 1.1278132241791309e-06, "1": 0}, "score": 4.936459336472196}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6916685099507244, "4": 0.29831246546019397, "3": 0.009945779387133416, "2": 2.806890999542875e-05, "1": 0}, "score": 4.681697389303882}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8905483485632449, "4": 0.10730999324409538, "3": 0.0021099015317503815, "2": 8.390705104127664e-06, "1": 0}, "score": 4.888442424927722}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6581722393371033, "4": 0.3347028017067235, "3": 0.007039177134131611, "2": 5.2023344886568346e-05, "1": 0}, "score": 4.651050994003306}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9048392548577826, "4": 0.0924450190344109, "3": 0.0026714844160277205, "2": 6.068203260032667e-06, "1": 0}, "score": 4.902190073777658}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7689948396247376, "4": 0.22415594193228647, "3": 0.006779492719240632, "2": 3.6824211791979305e-05, "1": 0}, "score": 4.762166774921161}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7344075420886762, "4": 0.259954126518672, "3": 0.00559951215620027, "2": 9.793477060237938e-06, "1": 0}, "score": 4.728809597230367}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6986128519895468, "4": 0.28598374655627423, "3": 0.015223448124600789, "2": 0.00013699816861489333, "1": 0}, "score": 4.683144752120504}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.49277874439913594, "3": 0.262588844230956, "5": 0.13654613993113415, "2": 0.06919214045837524, "1": 0.03885223402347544}, "score": 3.619000349987077}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5117626477713384, "4": 0.4578704203036546, "3": 0.028980696748132237, "2": 0.0010421758373829024, "1": 0.00033293675864458485}, "score": 4.479704124620417}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5202311223992927, "4": 0.455072814939959, "3": 0.023534225808410685, "2": 0.0008699981262966284, "1": 0.0002674994627610865}, "score": 4.494166429596839}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6220687262397018, "4": 0.3633356195890239, "3": 0.014204506579087237, "2": 0.000297263977735064, "1": 8.302506564801492e-05}, "score": 4.607027207942763}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6395636576956178, "5": 0.26067332081695016, "3": 0.089602370757876, "2": 0.008822864398080214, "1": 0.0013239931436404854}, "score": 4.149455303297064}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6430831418955141, "3": 0.27229751644537575, "5": 0.06898691707302479, "2": 0.014593054246609062, "1": 0.0010323102781386116}, "score": 3.764404697982731}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.48298834309484795, "4": 0.4664313869524106, "2": 0.04109259270000113, "5": 0.009010330739400878, "1": 0.00046434906189426453}, "score": 3.4424365081544557}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7362446430765193, "5": 0.1674622543961664, "3": 0.09450353856984012, "2": 0.0016734013288521134, "1": 0.00011075134551424574}, "score": 4.069280034025958}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6527199359431016, "4": 0.3395877829552214, "3": 0.007629110650857516, "2": 1.855962565982655e-05, "1": 0}, "score": 4.6450824837028195}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7502180210214731, "5": 0.1969560444026201, "3": 0.052419401423991645, "2": 0.0003668755016585824, "1": 0}, "score": 4.14380859508628}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.709551023669652, "4": 0.2855287369886366, "3": 0.004879341532919419, "2": 1.1857582756089646e-05, "1": 0}, "score": 4.704668430701728}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5281480905896044, "5": 0.468043592984342, "3": 0.003693920200137553, "2": 6.432759188596646e-06, "1": 0}, "score": 4.464386944090214}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5554964836419417, "4": 0.43973403532632305, "3": 0.0045317323290247815, "2": 8.958453019119496e-06, "1": 0}, "score": 4.55107291451659}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8488290139078596, "4": 0.15057093152634815, "3": 0.0005889927991141907, "2": 1.4202026290744274e-06, "1": 0}, "score": 4.848245359115447}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7854576165740031, "4": 0.2131399471816397, "3": 0.0013925008162319864, "2": 5.206998353461008e-06, "1": 0}, "score": 4.784058409126189}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4906576720251161, "5": 0.46009577713908967, "3": 0.04855408731712662, "2": 0.0006045668540878072, "1": 7.375498292072349e-05}, "score": 4.410117090910368}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7869444165973808, "4": 0.20533448404852564, "3": 0.007623246119968138, "2": 2.22587804551301e-05, "1": 0}, "score": 4.779335566362867}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6895005252259843, "4": 0.28070303034529126, "3": 0.029353628844298024, "2": 0.0003810821078072093, "1": 5.883980360600204e-05}, "score": 4.659210120293788}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9918305964378326, "4": 0.008060718359067109, "3": 0.00010233344580235254, "1": 6.407522244970653e-07, "2": 0}, "score": 4.991732004521866}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9762849697336218, "4": 0.02340054889131, "3": 0.00030682162662516054, "2": 1.0335965931753362e-06, "1": 0}, "score": 4.975982547922375}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8123766107524455, "5": 0.1662043206845644, "3": 0.021345848667863744, "2": 6.72631513159453e-05, "1": 3.6572465588519936e-06}, "score": 4.144713306742244}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5115936251340609, "5": 0.4792905160968033, "3": 0.009035915788273386, "2": 1.470061835644512e-05, "1": 0}, "score": 4.47025587967639}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5479664809798541, "4": 0.44553948733764853, "3": 0.006456544573748078, "2": 1.4557794548300305e-05, "1": 0}, "score": 4.541493236885575}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6946159472767481, "5": 0.2964336093854183, "3": 0.008935894709655666, "2": 9.099064062551388e-06, "1": 0}, "score": 4.2874810831942325}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5176197394641107, "5": 0.4697240567473727, "3": 0.012627790481578695, "2": 1.53458573474513e-05, "1": 0}, "score": 4.457071547310504}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9792921825294042, "4": 0.020402782303610485, "3": 0.0002938277049493451, "2": 1.49462831613813e-06, "1": 0}, "score": 4.979004874479379}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9664834539842023, "4": 0.032788861817392115, "3": 0.0006337389114105742, "2": 3.0820271866463976e-06, "1": 0}, "score": 4.965931318686785}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.976221236026076, "4": 0.023645865491086156, "3": 0.00010167623090238579, "1": 0, "2": 0}, "score": 4.976150037397568}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977378760674851, "4": 0.002228406105417935, "3": 1.7664439624799078e-05, "1": 0, "2": 0}, "score": 4.997736228674134}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.937937428084516, "4": 0.06181083538701537, "3": 0.00022880189869521283, "2": 8.488435018147832e-07, "1": 0}, "score": 4.937727638951032}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.533887626197226, "4": 0.4356300347508082, "3": 0.030073496802493323, "2": 0.0003580922224961957, "1": 4.148776472918767e-05}, "score": 4.502978140370994}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5796085599064479, "4": 0.39440621431539924, "3": 0.025741160303347586, "2": 0.00015293738021349102, "1": 4.7154552499684515e-05}, "score": 4.553444398095709}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7649219090800524, "4": 0.21725017702333121, "3": 0.017681312289639897, "2": 9.004995374513677e-05, "1": 0}, "score": 4.747102746778387}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.814824896292452, "4": 0.1797932678646788, "3": 0.005348488400282528, "2": 2.3296812717267286e-05, "1": 0}, "score": 4.809437949627969}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8449940441440835, "4": 0.15353713797695406, "3": 0.0014624527310941058, "2": 3.7302212862346516e-06, "1": 0}, "score": 4.843526353600428}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.525314861484195, "3": 0.44170351611368897, "5": 0.02636213443841969, "2": 0.006371718917745327, "1": 0.0002432692994660469}, "score": 3.571183443025047}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5764572191033183, "4": 0.4035927112526987, "3": 0.019892655216065633, "2": 4.514906441596639e-05, "1": 7.2181562839777705e-06}, "score": 4.556455419835379}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5235720116819962, "5": 0.41278677608735925, "3": 0.06330797312646244, "2": 0.00026590512120761446, "1": 4.6992337568620836e-05}, "score": 4.348813111138395}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912031274066667, "4": 0.008523212118307498, "3": 0.00026954343817262174, "2": 1.0453017063572133e-06, "1": 0}, "score": 4.990934537253528}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6428875843286846, "4": 0.31211833007931117, "3": 0.044603925862817494, "2": 0.00029749652908137806, "1": 7.371089062584702e-05}, "score": 4.597478856340019}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8229283431147588, "5": 0.13820512284397732, "3": 0.03860267902990281, "2": 0.00019257324174536583, "1": 0}, "score": 4.099224370219282}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7485252436798275, "5": 0.2277853820803866, "3": 0.023618697823085184, "2": 6.0757866160652155e-05, "1": 0}, "score": 4.20404719237737}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5153836830879917, "5": 0.470692859805828, "3": 0.013851684904409894, "2": 6.137548927421881e-05, "1": 0}, "score": 4.456723172342382}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7000636636519804, "5": 0.29107945728279233, "3": 0.008823532314195455, "2": 1.6062165828124347e-05, "1": 0}, "score": 4.2822286788425865}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.717168929597564, "5": 0.2581027803346537, "3": 0.024545974737437214, "2": 0.00010005365158493531, "1": 0}, "score": 4.23337589618705}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5172789990667621, "4": 0.45657897171938305, "3": 0.02558332773526417, "2": 0.0004550012007526467, "1": 9.996444352043325e-05}, "score": 4.49048760797987}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6761033702894901, "4": 0.3194514732856449, "3": 0.004413873192666997, "2": 2.504617341465703e-05, "1": 3.1000943855036852e-06}, "score": 4.671632211353173}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5777264166267649, "5": 0.40139945514799735, "3": 0.02073909733563272, "2": 0.00011332157323270247, "1": 0}, "score": 4.380441973801069}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8232250540306141, "4": 0.17410853671669704, "3": 0.0026470284705894073, "2": 1.2157284749337478e-05, "1": 0}, "score": 4.820559638300899}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6168266628251944, "4": 0.3771348172583141, "3": 0.0060132031642103805, "2": 2.0964815033781508e-05, "1": 2.2458892786306726e-06}, "score": 4.61076607866574}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5331363880641115, "5": 0.45121388760750836, "3": 0.01563611931957541, "2": 6.864104304616889e-06, "1": 0}, "score": 4.435566976194713}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9877506032098609, "4": 0.012101517754372475, "3": 0.0001471011665601231, "2": 9.477046754556587e-08, "1": 0}, "score": 4.9876039871334035}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5260270456398554, "4": 0.46608390845654124, "3": 0.00787574575268841, "2": 3.7208701713647804e-06, "1": 0}, "score": 4.518148821639853}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6265357520208064, "4": 0.36806152768224054, "3": 0.005397013683277719, "2": 1.9758971689456283e-06, "1": 0}, "score": 4.6211371038296365}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6517430172977426, "4": 0.3374266249032855, "3": 0.010814582760775179, "2": 1.0791055083692265e-05, "1": 0}, "score": 4.64091004671165}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7776802725530313, "5": 0.1729965027511434, "3": 0.0486488844853227, "2": 0.0005810764071699867, "1": 4.8580905267112736e-05}, "score": 4.123045220752736}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6508789947569686, "4": 0.3423864873529039, "3": 0.00667667146033158, "2": 5.240120346561306e-05, "1": 4.00616152806336e-06}, "score": 4.644086429287231}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7591979514430931, "4": 0.2373398971713148, "3": 0.003439074102760939, "2": 1.6785972341791643e-05, "1": 0}, "score": 4.755730059928102}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6301259682378019, "4": 0.36661940962895984, "3": 0.003231640099100823, "2": 4.723393758991572e-06, "1": 0}, "score": 4.626896327625784}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7340190845179353, "5": 0.24104573300212545, "3": 0.024805105005470694, "2": 8.784822046966683e-05, "1": 0}, "score": 4.2160740562019186}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5334657014487845, "5": 0.42598653550842774, "3": 0.0403968608001762, "2": 0.00013861323294116657, "1": 1.1655306361255632e-05}, "score": 4.385277726475055}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7193657413479534, "5": 0.23257656414830644, "3": 0.04782565825136958, "2": 0.00021592444567760364, "1": 1.2907719690005648e-05}, "score": 4.184280924298626}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6074932104766566, "4": 0.38280953926645367, "3": 0.009655778833657667, "2": 3.1155087606988974e-05, "1": 0}, "score": 4.597781288380187}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9741846200457697, "4": 0.025643319234104373, "3": 0.00017048913288787173, "2": 5.438877245969911e-07, "1": 0}, "score": 4.9740140441311915}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.995573769758889, "4": 0.004389203515081825, "3": 3.62084876914829e-05, "2": 1.3260566999043166e-07, "1": 0}, "score": 4.995537978633218}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5811576014291928, "3": 0.3625917258022249, "5": 0.04890719286327329, "2": 0.0068419602646990286, "1": 0.0004908583326547931}, "score": 3.6711554656208354}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6892599246361233, "4": 0.30330805705544406, "3": 0.0073896788673003975, "2": 3.175669464156158e-05, "1": 0}, "score": 4.681813947843703}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6370454601142284, "4": 0.323497238952605, "3": 0.03928315413370751, "2": 0.00014843416965432097, "1": 1.5470663574809134e-05}, "score": 4.597425144458643}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8371359218334504, "4": 0.159235968229598, "3": 0.0036141654773272427, "2": 8.442602025583846e-06, "1": 0}, "score": 4.83350945700241}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7121245735665584, "4": 0.2816720579008103, "3": 0.006168423402835393, "2": 1.557675218155602e-05, "1": 0}, "score": 4.705938669546084}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9953506269534399, "2": 0.004480834399541258, "3": 0.00015530292398636207, "5": 6.483837604358712e-06, "4": 6.453886825807187e-06}, "score": 1.0048367386997499}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7912535650036991, "2": 0.17754196064575828, "3": 0.027145841823606184, "4": 0.0032386976171659807, "5": 0.0008153176223254934}, "score": 1.2448121380017818}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9939492774996046, "2": 0.005764700949886967, "3": 0.00026009801947860493, "5": 1.5463471388559745e-05, "4": 9.802589230406331e-06}, "score": 1.0063761628342278}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9616916402318358, "2": 0.03573482769733021, "3": 0.0023107179543238564, "4": 0.00019129706959685085, "5": 7.084487006671113e-05}, "score": 1.0412135619978375}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9920162706171186, "2": 0.007691272765438201, "3": 0.0002686513810766338, "4": 1.2477194749215929e-05, "5": 1.0219233254752258e-05}, "score": 1.0083068932556107}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6039363303086376, "4": 0.3512263119136722, "3": 0.04360670744402889, "2": 0.0011211133779471963, "1": 0.00010071558536069393}, "score": 4.557790169826299}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7758724817065024, "4": 0.21719068034828612, "3": 0.0068733181368323785, "2": 5.174343467761642e-05, "1": 7.3949294653585564e-06}, "score": 4.768876860703008}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6761896939171265, "5": 0.22626805465631422, "3": 0.09518971297582701, "2": 0.002230541272206514, "1": 0.00011988639163442057}, "score": 4.126257866464621}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9256082037241867, "4": 0.07386207324663062, "3": 0.0005269965794769749, "2": 1.384461918931078e-06, "1": 0}, "score": 4.925079679666505}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5107059473039138, "5": 0.47664809819057546, "3": 0.012509652908651627, "2": 7.402127545007229e-05, "1": 0}, "score": 4.464019302002293}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4701638161526944, "4": 0.46578125729864867, "3": 0.05967142597776945, "2": 0.002881801959813252, "1": 0.001492699579543906}, "score": 4.400254289417638}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9025229407360902, "4": 0.09181735012782624, "3": 0.005495289545368573, "2": 9.008183707177838e-05, "1": 4.68946481951878e-05}, "score": 4.896731412666709}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6920685275610703, "4": 0.28190757781686626, "3": 0.025495431493141974, "2": 0.0004563237601736988, "1": 6.128950113003028e-05}, "score": 4.665483800455328}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8274871504571014, "4": 0.15910116837715885, "3": 0.012947565510194211, "2": 0.00034662006202524384, "1": 0.00010658614782847816}, "score": 4.813535461600308}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.45013206567347547, "5": 0.438709550958299, "3": 0.10074003411708088, "2": 0.0072098942133869345, "1": 0.0031960957250791637}, "score": 4.313965321634787}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.666681738909153, "4": 0.32156698677799794, "3": 0.011604511895327917, "2": 9.633912877840964e-05, "1": 0}, "score": 4.654917571854096}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7831581216658771, "4": 0.21483246224415353, "3": 0.0019898699383394595, "2": 5.3410355530544006e-06, "1": 0}, "score": 4.7811686662480115}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7288980178276397, "4": 0.2687077288261708, "3": 0.0023750471240193936, "2": 8.155924192388153e-06, "1": 0}, "score": 4.726514687059012}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7790622080574923, "4": 0.2192221236370774, "3": 0.0016926915225889915, "2": 3.9687514855248725e-06, "1": 0}, "score": 4.777376355426072}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7116998965735655, "4": 0.2863399035177405, "3": 0.001920473132735388, "2": 3.221227692856039e-06, "1": 0}, "score": 4.709798892583177}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7897127557153697, "2": 0.20134417939484145, "3": 0.008642904358920345, "4": 0.0002462328315343661, "5": 5.042704094900517e-05}, "score": 1.2195711634147155}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4868015664610351, "1": 0.2751538728945793, "3": 0.20939310677973086, "4": 0.025481947976586664, "5": 0.003144307197688357}, "score": 1.9946359162635048}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9776490098462144, "2": 0.021165971601821296, "3": 0.001109905280701819, "4": 4.707092740822217e-05, "5": 2.8002129419061724e-05}, "score": 1.023639004413755}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8170046847912152, "2": 0.15957831087091717, "3": 0.020467203565483736, "4": 0.002252035961810099, "5": 0.0006967120919801112}, "score": 1.2100558953849823}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7006617313375358, "2": 0.25709325499549535, "3": 0.038363798939269673, "4": 0.003055035702034071, "5": 0.0008226155490703112}, "score": 1.346277656128741}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8068552377602456, "3": 0.17365003469389367, "5": 0.018807576218110487, "2": 0.0006751605793844459, "1": 8.36985497814075e-06}, "score": 3.843781545150144}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6369087393500668, "4": 0.349103688216, "3": 0.01386007325334804, "2": 0.00010144741221520414, "1": 0}, "score": 4.622861997928785}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.770676044086267, "5": 0.12087395143914706, "3": 0.10732803357020662, "2": 0.0010640701072082853, "1": 5.620161864314137e-05}, "score": 4.011249191912979}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7517207252550978, "5": 0.23784780134946198, "3": 0.01040971993682563, "2": 1.4161989190640832e-05, "1": 0}, "score": 4.227411483821581}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8403132583983002, "3": 0.08592793492558087, "5": 0.07332359687492306, "2": 0.0004216754565984533, "1": 1.1093502293623234e-05}, "score": 3.9865189976242634}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8738980043193538, "4": 0.09427447544006008, "3": 0.02478419815649632, "1": 0.004750980315589982, "2": 0.0022770421064468305}, "score": 4.830319484610704}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9573064493803807, "4": 0.026497364599786685, "3": 0.00795073421891353, "1": 0.007178154230007653, "2": 0.00103336583854236}, "score": 4.925785934314914}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.995250242942257, "4": 0.002699623392391872, "1": 0.0012947948673092697, "3": 0.0006910288389316342, "2": 5.588922227832538e-05}, "score": 4.990571392397849}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9722412322368053, "4": 0.024684617564954797, "3": 0.0024456092624527744, "1": 0.0004680765532982581, "2": 0.00015605625605246939}, "score": 4.9680835482370345}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955769628677614, "4": 0.003994950860858988, "3": 0.00033250488707714624, "1": 7.70433736920153e-05, "2": 1.1299580012184606e-05}, "score": 4.994997930923052}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8801683614320833, "3": 0.0709085188237222, "5": 0.04798129651247365, "2": 0.0008976704851879125, "1": 3.1538863837047136e-05}, "score": 3.9751825070819202}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.814045327207357, "5": 0.12649990775807574, "3": 0.059100535127514675, "2": 0.0003355570068135124, "1": 9.779335705475331e-06}, "score": 4.066699513806249}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6835829291766927, "5": 0.2883220772268459, "3": 0.027926575964669013, "2": 0.0001506613432252707, "1": 0}, "score": 4.260098796965021}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8697269562356111, "3": 0.07641975063914859, "5": 0.05327230440633724, "2": 0.0005516272563574828, "1": 1.5637721775275465e-05}, "score": 3.975702052630417}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.76809732392698, "5": 0.18839197750344516, "3": 0.04329805777762141, "2": 0.00018155262525084895, "1": 0}, "score": 4.144735314030894}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8104925578662598, "4": 0.17551615307469742, "3": 0.013844164096798478, "2": 8.425530696779217e-05, "1": 3.2167111801326035e-05}, "score": 4.796407833566256}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4680186188445363, "5": 0.3409954653093814, "3": 0.18530410364194833, "2": 0.004517416587381808, "1": 0.0011600091337180406}, "score": 4.143177129135563}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5950929304511668, "4": 0.3626521023507792, "3": 0.04175913705554402, "2": 0.0003584565875346915, "1": 0.00010945522461049161}, "score": 4.552303933950411}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5239628993158925, "4": 0.4412832718285001, "3": 0.034604612380779914, "2": 0.00012688276602401292, "1": 1.1609765042151959e-05}, "score": 4.4890749369200575}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5400179495871765, "5": 0.27528336325199404, "3": 0.1799212902705138, "2": 0.0041676497965587155, "1": 0.0005819165531383666}, "score": 4.085283397211998}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5675749317595811, "5": 0.4004417364841363, "3": 0.03158667261632108, "2": 0.000374894651798129, "1": 1.576002322292149e-05}, "score": 4.368060204499145}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6575366993407941, "5": 0.3113587794663652, "3": 0.030927398657777966, "2": 0.00014208359164599236, "1": 1.9492300822026183e-05}, "score": 4.280093091230011}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7198098781259017, "5": 0.26066406707831596, "3": 0.01947997430137268, "2": 3.47048538635472e-05, "1": 0}, "score": 4.241117425934383}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6186050222674876, "5": 0.3744079727002719, "3": 0.006921830646820638, "2": 7.249993395961266e-06, "1": 0}, "score": 4.367492928871137}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8510762959177862, "5": 0.13240230847757456, "3": 0.016466351225269613, "2": 3.4983221399640585e-05, "1": 0}, "score": 4.115868315262081}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6704398161138065, "3": 0.27827559706827293, "5": 0.03285409119833382, "2": 0.017026021989438353, "1": 0.0014005484066879294}, "score": 3.7163236914382187}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9231365757799032, "4": 0.07582569951974975, "3": 0.000746375300861672, "2": 3.4904880120238364e-06, "1": 0}, "score": 4.922648812185765}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7958795688489118, "4": 0.20307754049330348, "3": 0.0008864350506963023, "2": 2.3808118857156937e-06, "1": 0}, "score": 4.795110878720246}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9740803099415177, "4": 0.025766275326970522, "3": 8.88403161766187e-05, "2": 2.2540568811757202e-07, "1": 0}, "score": 4.974053698204788}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7421977217134527, "5": 0.2410032162849086, "3": 0.016685074528370723, "2": 8.716000417390547e-05, "1": 0}, "score": 4.224149835120965}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5465268181592662, "4": 0.44026711795974766, "3": 0.013108085833373136, "2": 4.870031790858572e-05, "1": 0}, "score": 4.53334761384963}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7640931142129218, "4": 0.22599131718122567, "3": 0.00986393601362414, "2": 2.037055667337592e-05, "1": 0}, "score": 4.754212015288789}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9171213663102384, "4": 0.08149142328824849, "3": 0.0012953906099585368, "2": 4.183384291055398e-06, "1": 0}, "score": 4.915897874930877}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9514735631737772, "4": 0.047847447800896226, "3": 0.000623473247962279, "2": 1.561485416006754e-06, "1": 0}, "score": 4.950898271997963}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9304928750955714, "4": 0.06866703738943312, "3": 0.0007716840140147826, "2": 1.230392910695591e-06, "1": 0}, "score": 4.929781186587864}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6549434650321995, "5": 0.3079181432500447, "3": 0.03655459070461473, "2": 0.0005228384670599007, "1": 5.739496363722642e-05}, "score": 4.270146654490861}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.769087832102957, "4": 0.22006174784237506, "3": 0.010731539032066306, "2": 9.815261448010417e-05, "1": 1.3854755872192306e-05}, "score": 4.758123634652539}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6521735966263418, "4": 0.33700743047014986, "3": 0.0107204247706146, "2": 7.418890108826375e-05, "1": 1.4087255986868005e-05}, "score": 4.641269119386478}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9228309998481276, "4": 0.07584311109913235, "3": 0.0013136628168898797, "2": 4.939057670104864e-06, "1": 0}, "score": 4.92151417415388}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6535324444126814, "4": 0.3336147816422549, "3": 0.012744187419413347, "2": 8.304640583198276e-05, "1": 1.656666523414377e-05}, "score": 4.640578212385399}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5679893559279738, "5": 0.328654280455049, "3": 0.09864303027977846, "2": 0.003969558498155088, "1": 0.0007385856384657626}, "score": 4.219857517148318}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4897082614427981, "5": 0.2615286869406622, "3": 0.22502393604808357, "2": 0.01924297538328705, "1": 0.004470336024123636}, "score": 3.9846073948603715}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5357149334323525, "5": 0.24945199178515326, "3": 0.19759567135628237, "2": 0.015079084919112572, "1": 0.0021547934648417423}, "score": 4.015233823895994}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5837947928553897, "4": 0.3235553119188898, "3": 0.08673860701665359, "2": 0.004277089175256347, "1": 0.0016206369953780172}, "score": 4.483646655736621}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9140170714200057, "4": 0.08021277399878816, "3": 0.005641603191796598, "2": 6.433787914106534e-05, "1": 3.199438945716976e-05}, "score": 4.90818007006495}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.45249285772494324, "3": 0.4200997482790124, "5": 0.08776425321727166, "2": 0.035510864040795655, "1": 0.004117846279479772}, "score": 3.5842832390347628}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5300368958752548, "3": 0.3157253149200278, "5": 0.13218348284875128, "2": 0.020362522501673967, "1": 0.0016878894106033243}, "score": 3.770668561575193}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6832104574861468, "5": 0.21923521158853002, "3": 0.09662410835581749, "2": 0.0008331528826870252, "1": 6.175933004645503e-05}, "score": 4.120763783689486}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.691705390698907, "4": 0.2886593805486361, "3": 0.01945573682432766, "2": 0.00014744998860255615, "1": 2.0317926150196406e-05}, "score": 4.671901677503178}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6850821780221084, "3": 0.22365493133631412, "5": 0.07061575505217796, "2": 0.018967803307014443, "1": 0.0016691869957255426}, "score": 3.8040156677974277}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8303383837582504, "5": 0.10775460641077596, "3": 0.061066209609427685, "2": 0.0007868643404069328, "1": 3.80360562281688e-05}, "score": 4.04500127546425}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7917280716499824, "3": 0.1564629246911203, "5": 0.04492598594890864, "2": 0.0064871070672047094, "1": 0.00039220546895416545}, "score": 3.874311765019758}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.755858749156048, "3": 0.21108275892749112, "5": 0.02520754813873067, "2": 0.007487125002000877, "1": 0.0003586369365521969}, "score": 3.7980735820473575}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5867305813906152, "5": 0.3987335139754399, "3": 0.01446823098190538, "2": 5.298238808071606e-05, "1": 0}, "score": 4.384164962086235}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9025051612092866, "3": 0.06135724634299352, "5": 0.035632020255626354, "2": 0.00048221378736424027, "1": 1.8938077123324414e-05}, "score": 3.973253413877861}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.844740398108862, "5": 0.11490598577115176, "3": 0.04009065957924414, "2": 0.00023783224161317375, "1": 2.396747152651328e-05}, "score": 4.074267845209195}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.688337175796328, "4": 0.3049133930229613, "3": 0.006707862051540496, "2": 2.4070585056605103e-05, "1": 0}, "score": 4.681593099461593}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7178133657532593, "4": 0.2741443188846243, "3": 0.007980849656042531, "2": 2.442772012031885e-05, "1": 0}, "score": 4.709809950587956}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5910872448804577, "4": 0.40184443615337984, "3": 0.0070175606997304185, "2": 1.405774596313738e-05, "1": 0}, "score": 4.5840630041050385}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6433806109037723, "4": 0.3469507291635774, "3": 0.009629804062040715, "2": 2.9927493051460357e-05, "1": 4.380305881742807e-06}, "score": 4.633680692963195}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5950379761565934, "4": 0.3551426994476707, "3": 0.04841720757672895, "2": 0.0010856355533781616, "1": 0.0002910431558204256}, "score": 4.543590195912741}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6955605790318702, "5": 0.1666380473288233, "3": 0.13108691532766964, "2": 0.00529124876253096, "1": 0.0014081301351283042}, "score": 4.020744556886468}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7747946674180656, "4": 0.21049124882537962, "3": 0.014537918121047076, "2": 0.00013106318798846686, "1": 3.262117306145526e-05}, "score": 4.759906244000251}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5293109566859627, "4": 0.3627891744784048, "3": 0.10274948888226647, "2": 0.003849380702941694, "1": 0.0012755872731833593}, "score": 4.415046491730265}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5642636342979986, "5": 0.3458866703220392, "3": 0.08933057182713544, "2": 0.0004588552762084864, "1": 5.595056639626163e-05}, "score": 4.2554716392958065}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6579555717981524, "4": 0.32605848886885497, "3": 0.015884873099382427, "2": 8.157766880933537e-05, "1": 0}, "score": 4.6419200534617095}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7335773966942852, "4": 0.26331403755013566, "3": 0.0030967890333241663, "2": 6.9217633599083295e-06, "1": 0}, "score": 4.730470310537573}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7958995775127805, "5": 0.17184652448683468, "3": 0.03212915518020786, "2": 0.00011327670677384746, "1": 0}, "score": 4.139492415328932}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6649299381779584, "4": 0.3306718781352176, "3": 0.00438620451950276, "2": 8.69291701586493e-06, "1": 0}, "score": 4.660528518486469}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5636071571779544, "5": 0.41785102897138793, "3": 0.018430595433164835, "2": 6.895668528341256e-05, "1": 0}, "score": 4.39929939525177}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6007973435880256, "4": 0.3723881107906944, "3": 0.02564268328767314, "2": 0.0007248549442675441, "1": 0.0004373509482188677}, "score": 4.572398424898848}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7865185431231022, "2": 0.16351600557679888, "3": 0.03664366561876592, "4": 0.00908525054171701, "5": 0.004234003837146649}, "score": 1.2809958150734688}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.3985122663184014, "5": 0.3296669752438883, "3": 0.24971293022436505, "2": 0.014272887790889473, "1": 0.007804565468836427}, "score": 4.027995423390922}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5898738373195243, "4": 0.2910956417505413, "3": 0.10340525460177757, "1": 0.008825035972209818, "2": 0.006784972762997308}, "score": 4.446430340727543}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.49993211488877815, "4": 0.45931685094693275, "3": 0.03940916009417176, "2": 0.0009133197679226537, "1": 0.00042632064799655295}, "score": 4.4574183750292455}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6001763201618528, "5": 0.2919129025926841, "3": 0.10654450433934988, "2": 0.0012019709634794042, "1": 0.00010409381480569951}, "score": 4.182663172689609}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9672549633608496, "4": 0.03204790065323439, "3": 0.0006930128613499843, "2": 1.888074559047111e-06, "1": 0}, "score": 4.9665603346610645}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9170765421817596, "4": 0.08179264122456674, "3": 0.0011165563698057048, "2": 3.252238595890703e-06, "1": 0}, "score": 4.915963564248187}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9325655696105214, "4": 0.06683327458041796, "3": 0.0002864937033176108, "2": 1.6111877677776218e-07, "1": 0}, "score": 4.932572048499321}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5121368164553922, "5": 0.4675544997699266, "3": 0.01983566894696932, "2": 2.775096343489234e-05, "1": 0}, "score": 4.447862745993035}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5183156807747308, "4": 0.3481758885586989, "3": 0.09440130327941279, "1": 0.021928695566789298, "2": 0.01713956577752666}, "score": 4.32386174646441}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.797034901547129, "4": 0.19130076568665574, "3": 0.011118065178919712, "2": 0.00033201845607683787, "1": 0.00018913084137767714}, "score": 4.7847051173825}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6321478577890269, "4": 0.34383836541876145, "3": 0.022466690250657652, "2": 0.0009341262103594561, "1": 0.0005944339201427044}, "score": 4.606040841118959}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8417837724795346, "4": 0.14609381428989482, "3": 0.010856475030409263, "1": 0.0006574755374524537, "2": 0.0005967161609052484}, "score": 4.827771161930403}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7315322587800893, "4": 0.2569654086084929, "3": 0.010976309615359512, "2": 0.0003605909660717007, "1": 0.000157666581233501}, "score": 4.719367353699206}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9055886579139096, "4": 0.09263706013083474, "3": 0.0017659323225262683, "2": 4.087095446387273e-06, "1": 0}, "score": 4.903818403960133}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9697401848822044, "4": 0.02999177804648067, "3": 0.0002557014512722045, "2": 6.113281203928043e-07, "1": 0}, "score": 4.96949462741272}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8948288124567112, "4": 0.10330575426534404, "3": 0.0018334066230532233, "2": 4.268461927267183e-06, "1": 0}, "score": 4.893011657299707}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9539398660605988, "4": 0.045864893594264496, "3": 0.00018526200343811134, "2": 2.719441833447166e-07, "1": 0}, "score": 4.953763317774691}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9716820802067117, "4": 0.02818224244259418, "3": 0.0001233963531511234, "2": 1.8521380064296767e-07, "1": 0}, "score": 4.97157006532736}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6981556198466233, "5": 0.23398489897540586, "3": 0.06608816467312426, "2": 0.0014182422872336849, "1": 0.0003467294725808964}, "score": 4.164021101982144}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6388525259826324, "4": 0.3235657952808255, "3": 0.0339153352373264, "2": 0.002490468085570042, "1": 0.0011591607814009294}, "score": 4.59648874231993}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6613479620597819, "4": 0.3145306975917581, "3": 0.02293714339729807, "2": 0.0007953075203932983, "1": 0.00038731521012875375}, "score": 4.635659258659237}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.671858544414686, "4": 0.31638438385863055, "3": 0.011510637168053917, "2": 0.00016392672971533254, "1": 6.72455979242691e-05}, "score": 4.659828387446692}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5487016652615987, "4": 0.42316353799781575, "3": 0.02727316028864587, "2": 0.0006133540005795362, "1": 0.00023372438001882412}, "score": 4.519508186868984}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5858217597040707, "5": 0.4023234950166666, "3": 0.01180762582368108, "2": 2.60251026288332e-05, "1": 0}, "score": 4.390472055743089}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9860949912596246, "4": 0.013874306535806282, "3": 2.3120104367617005e-05, "2": 4.876056231981608e-08, "1": 0}, "score": 4.986079202103673}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9704731042977569, "4": 0.029347811531575823, "3": 0.00016870363863040328, "2": 5.328877688296817e-07, "1": 0}, "score": 4.97031289017976}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7716486647652319, "4": 0.22718275438765106, "3": 0.001147796800270936, "2": 2.0272628996795972e-06, "1": 0}, "score": 4.770511265752502}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8154264100896713, "4": 0.18171039418777762, "3": 0.0027747794844619794, "2": 1.2338994818211837e-05, "1": 0}, "score": 4.812688779737573}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9934668749675144, "4": 0.00645553743135372, "3": 7.248767576512787e-05, "1": 1.4007174336428764e-06, "2": 0}, "score": 4.9933938599098955}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9904192486623569, "4": 0.009410346533251995, "3": 0.0001488686774560059, "1": 4.845214699408292e-06, "2": 0}, "score": 4.990272372890068}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.998507200335539, "4": 0.001422276246918029, "3": 5.234856671052996e-05, "1": 1.2565545169088485e-05, "2": 0}, "score": 4.998422755591739}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9578277249505832, "4": 0.04054597757547874, "3": 0.0015652769590633034, "1": 2.6621004790791124e-05, "2": 2.5248343710958366e-05}, "score": 4.956140838093612}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9880875428856484, "4": 0.011175365858530784, "3": 0.0006520195577098546, "1": 5.243202443372748e-05, "2": 0}, "score": 4.987310452745633}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9112193147736642, "4": 0.0875438647328932, "3": 0.0008513255096499171, "2": 5.258772097533111e-06, "1": 0}, "score": 4.910703754265318}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8677121879583197, "4": 0.13152418867281904, "3": 0.000646376956740316, "2": 1.3115131644302523e-06, "1": 0}, "score": 4.8671637225138}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9837517857543239, "4": 0.016144184290799418, "3": 4.894545711176888e-05, "1": 0, "2": 0}, "score": 4.983757030059136}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.968727478097803, "4": 0.03116405287019235, "3": 8.431025934046199e-05, "2": 2.3788844301248456e-07, "1": 0}, "score": 4.968665863405544}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9649305781228575, "4": 0.03499587785500837, "3": 5.8256376715459384e-05, "2": 1.7244991335485782e-07, "1": 0}, "score": 4.964886561295329}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5853434909772364, "3": 0.3321195780711366, "5": 0.058240988637848566, "2": 0.019553139836477832, "1": 0.004721933138458818}, "score": 3.6728425039177397}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8422898028922329, "4": 0.15670324836514793, "3": 0.0009998262940707592, "2": 2.1777093292595777e-06, "1": 0}, "score": 4.841289781138079}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6881391559126144, "5": 0.27340143663664607, "3": 0.03824681462328489, "2": 0.00016864746967139017, "1": 0}, "score": 4.234827646658968}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8673228200835265, "4": 0.13121968180046834, "3": 0.0014347193841616893, "2": 4.757582009426658e-06, "1": 0}, "score": 4.865894189944283}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7593265173169335, "4": 0.2313077971953792, "3": 0.00912100302620342, "2": 0.00013410653990490425, "1": 7.98693806133453e-05}, "score": 4.74972071439891}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6332451810493841, "3": 0.3264955695117955, "4": 0.02132641998528847, "1": 0.018547523553496207, "5": 0.00038385933023649024}, "score": 2.3517529727548134}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8372936614718791, "5": 0.13497149108404025, "3": 0.02760615841971475, "2": 0.00011402235868325889, "1": 1.2457384230384979e-05}, "score": 4.1071001524086475}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8611128281433751, "5": 0.08437517970117564, "3": 0.05412725666223733, "2": 0.0003514875735394739, "1": 3.187208530750097e-05}, "score": 4.029449372153395}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5623282808496706, "4": 0.4324879777960065, "3": 0.005167005320344259, "2": 9.725949872156724e-06, "1": 0}, "score": 4.5571457292680035}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8372608402036504, "5": 0.08337830794759742, "3": 0.07879026739201027, "2": 0.000532090111738074, "1": 3.3640125237227574e-05}, "score": 4.003422956572183}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5549015879320133, "3": 0.28655233194891583, "5": 0.12917355386928306, "2": 0.028127360305653888, "1": 0.0012382271996884985}, "score": 3.7826503115760506}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7770315224528652, "3": 0.1236558963926528, "5": 0.09581922841515916, "2": 0.003376334248136072, "1": 9.363390567090985e-05}, "score": 3.9651289463640853}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7910514809158583, "5": 0.11674711425973237, "3": 0.09083988751696541, "2": 0.0012975073217148469, "1": 5.182333642566977e-05}, "score": 4.023157024296595}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7260112052847014, "5": 0.2133717989439961, "3": 0.05945769664818314, "2": 0.0010890287881296066, "1": 5.9380658446420526e-05}, "score": 4.151559553178727}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6819324315639335, "3": 0.23765479485626165, "5": 0.0654398224410804, "2": 0.01431944750853714, "1": 0.0006475634998063855}, "score": 3.797202237423175}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9376127609722823, "4": 0.060359012825251634, "3": 0.0020047386015794935, "2": 1.3013542655622038e-05, "1": 9.62968541378378e-06}, "score": 4.93555389618543}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8988773978057247, "4": 0.07874162942041492, "3": 0.0211381185928618, "2": 0.0007085352124985651, "1": 0.0005324609480847632}, "score": 4.874726451203215}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5114251492887182, "5": 0.4566077097042379, "3": 0.03160861085809795, "2": 0.00032601505391837316, "1": 3.061960707855868e-05}, "score": 4.424256014089229}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9192935907660974, "4": 0.07802861192524242, "3": 0.002642169285977515, "2": 2.2791611645148086e-05, "1": 1.217470645206056e-05}, "score": 4.916569920635992}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5648922353056693, "5": 0.4044270115204704, "3": 0.030462708974405416, "2": 0.00016142853838627724, "1": 0}, "score": 4.373662600624443}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5578145608834102, "4": 0.4207442256292706, "3": 0.02066609178183581, "2": 0.0005604691820081441, "1": 0.00020865737610123385}, "score": 4.535404768439747}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7781357532397295, "4": 0.21456421817279114, "3": 0.006887700460182266, "2": 0.00021144407822390216, "1": 0.000184005667352651}, "score": 4.770286148804695}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.704466993288004, "4": 0.23803996481899642, "3": 0.03240785653275084, "1": 0.014990269325765249, "2": 0.010078206084344829}, "score": 4.606942058580803}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8884943370632792, "4": 0.11081469357151662, "3": 0.0006828754993514286, "2": 3.9393059696723e-06, "1": 0}, "score": 4.887807271400463}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.889192158973023, "4": 0.10636468128393133, "3": 0.0042131432275204555, "2": 0.00012221460514463445, "1": 0.00010309259427764521}, "score": 4.884429473810344}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9813726000147653, "2": 0.01413725171290058, "3": 0.0025683952280312204, "5": 0.001302838413053922, "4": 0.0006183140858999138}, "score": 1.0263403538974551}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9831234556785708, "5": 0.014271589017195599, "2": 0.0018009823733180197, "3": 0.0005434204653575697, "4": 0.0002596289660015583}, "score": 1.0607531223763018}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9973343247388893, "2": 0.0010962878369300808, "5": 0.0010862264084102893, "3": 0.00040103814920829046, "4": 8.185092115712607e-05}, "score": 1.006488824297065}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.906423049381887, "5": 0.03626480381292827, "2": 0.03300461760105078, "3": 0.015188176737900199, "4": 0.00911432433785496}, "score": 1.2357843448960848}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9870482640475343, "2": 0.01067053152508113, "3": 0.0013778641447036862, "5": 0.0005222775011178526, "4": 0.00038043090011722144}, "score": 1.0166566730443543}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8445647694977446, "5": 0.13174413614361416, "3": 0.02353982526675966, "2": 0.00012624513818197696, "1": 0}, "score": 4.107954522049452}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8610915158646191, "5": 0.11549736074199828, "3": 0.0233222882123514, "2": 6.79649450283713e-05, "1": 1.0731877928496676e-05}, "score": 4.092007879814635}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7960921129868909, "5": 0.17750008343685292, "3": 0.026288492055166816, "2": 9.681689923934647e-05, "1": 1.2134869170669837e-05}, "score": 4.150983117123448}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7033847075062203, "4": 0.2952717973124239, "3": 0.001325602772961807, "2": 2.3573227755612025e-06, "1": 0}, "score": 4.7020652967322025}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5856558199060288, "5": 0.4047290532823113, "3": 0.009567168402553316, "2": 2.934774048008589e-05, "1": 0}, "score": 4.395110542670177}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5136101316849713, "5": 0.46795249248563087, "3": 0.01811530351275738, "2": 0.00018487271439217426, "1": 0}, "score": 4.449529118760382}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5451077649567831, "5": 0.43332643220855455, "3": 0.021428304300404905, "2": 0.00011476718039645852, "1": 1.5165506774599215e-05}, "score": 4.411626211328005}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7450153923079269, "5": 0.21635164692980596, "3": 0.03832639330097076, "2": 0.0002676083572009453, "1": 2.1011996950582427e-05}, "score": 4.177430185282128}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.534560032273361, "5": 0.44810930139339183, "3": 0.01722692004137351, "2": 8.522455171259164e-05, "1": 0}, "score": 4.430719909930846}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6432070180689865, "5": 0.3383546071077912, "3": 0.01826232654186966, "2": 0.00015650071176112498, "1": 1.74405605215986e-05}, "score": 4.319727631129854}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5487145599022437, "4": 0.32473081545104054, "2": 0.0759835051311449, "5": 0.043761843248021015, "1": 0.006714066337496429}, "score": 3.322873604914285}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5135201550720815, "2": 0.28474182114492985, "4": 0.16139346716802613, "1": 0.022558025011521467, "5": 0.017772321567850618}, "score": 2.8670783503143813}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.40999902390751314, "3": 0.39182271466462837, "5": 0.17246521759028421, "2": 0.023392505165396885, "1": 0.0022319737394760632}, "score": 3.7271374053190987}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5712775330704863, "4": 0.32952706131173043, "3": 0.09361813165462134, "2": 0.004270268812397663, "1": 0.0008444740925869154}, "score": 4.466801351636441}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.602971287183361, "5": 0.21587291520055618, "3": 0.1735116907536259, "2": 0.007050046968370071, "1": 0.0004467787733799253}, "score": 4.026924759698833}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7554611511258547, "5": 0.22874045556568628, "3": 0.015752955193149006, "2": 4.049109437527832e-05, "1": 0}, "score": 4.212907571441999}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8934384974927074, "5": 0.05801969831354512, "3": 0.04828496743483278, "2": 0.00023750900961216133, "1": 0}, "score": 4.009259891832356}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9372166751373554, "5": 0.04193889084880739, "3": 0.02078027208078495, "2": 4.0391952030798664e-05, "1": 0}, "score": 4.021078335895606}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9084080927452145, "5": 0.07519740173646881, "3": 0.016223102051976503, "2": 2.511874946619893e-05, "1": 0}, "score": 4.058932683136428}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7313003705536297, "5": 0.25890364850266834, "3": 0.009711123479742335, "2": 1.598000986966886e-05, "1": 0}, "score": 4.249177727730689}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6479406087460154, "4": 0.33943425607481287, "3": 0.012520090310969229, "2": 3.514156289346979e-05, "1": 0}, "score": 4.6353946514955755}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5083480135047439, "4": 0.43115788217690604, "3": 0.05962420876800272, "2": 0.0007076411804604595, "1": 0.00015826574617408835}, "score": 4.446835507396}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7053957966610263, "5": 0.26762573117184546, "3": 0.02688740009667571, "2": 7.587373354942687e-05, "1": 8.373471536611707e-06}, "score": 4.240563105004265}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5778728021570214, "3": 0.2931120851329975, "5": 0.11668138079726183, "2": 0.010675103760089281, "1": 0.001620487417486469}, "score": 3.797349896667708}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4692765150237462, "4": 0.4670530641678361, "3": 0.062336658954974304, "2": 0.0010221752749473136, "1": 0.0003010584879395561}, "score": 4.4039965833676735}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"4": 0.49485187679118436, "5": 0.47870380212990393, "3": 0.026168622511311104, "2": 0.000224051415268302, "1": 4.6808769037339496e-05}, "score": 4.451948837182648}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9074247376512073, "4": 0.09132897329935087, "3": 0.001240560978068286, "2": 1.7054833460234018e-06, "1": 0}, "score": 4.906184410913009}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6318981834182147, "5": 0.2984670611931154, "3": 0.06905419140191393, "2": 0.0005073545952111091, "1": 5.7566140594921465e-05}, "score": 4.228229032423022}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9337222330550202, "4": 0.06578154178426052, "3": 0.0004867251343844502, "2": 7.69074494669946e-07, "1": 0}, "score": 4.933242117863632}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5492049236485763, "4": 0.4236065934932841, "3": 0.0270049553050683, "2": 0.00014738947280395237, "1": 2.737306656731096e-05}, "score": 4.521827644024647}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7329195921815572, "5": 0.09902806343271248, "2": 0.07452537556357292, "3": 0.060975691148234354, "4": 0.03254804413992613}, "score": 1.6902353759102238}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5084443037368989, "4": 0.44030732058571154, "3": 0.049752299268162735, "2": 0.0010582450035513452, "1": 0.00043576245110846094}, "score": 4.455269169039535}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.650128099081033, "4": 0.23231933727229967, "3": 0.09527676567383224, "1": 0.013129328951611953, "2": 0.009140852742514008}, "score": 4.497184433393685}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.27223609305448465, "4": 0.26422086916155585, "5": 0.24283016244000888, "1": 0.11972502786641173, "2": 0.10098524115466795}, "score": 3.40944696430507}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32688743592231984, "4": 0.26310970618426666, "2": 0.24386265536942242, "1": 0.12937573937538663, "5": 0.03676120139137489}, "score": 2.8340174334519843}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9561841920315969, "2": 0.0288609329329456, "5": 0.008205107112380023, "3": 0.005423989305748631, "4": 0.0013229432363804116}, "score": 1.0764983866051723}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9437906183819085, "4": 0.050634759089263195, "3": 0.004920714674412797, "1": 0.0004133046440494657, "2": 0.0002368614942765089}, "score": 4.937159773372597}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7786362865687212, "4": 0.18916784296440262, "3": 0.02520282972737618, "1": 0.004773103770722369, "2": 0.002196410153013277}, "score": 4.734738611283094}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.993203515783381, "4": 0.004846987020327677, "1": 0.001019706946825861, "3": 0.0008392939124746774, "2": 8.720464152222861e-05}, "score": 4.989133947675117}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.4158961871432952, "5": 0.23637735241653657, "3": 0.13784192794882075, "4": 0.12003905869922352, "2": 0.08982145611279371}, "score": 2.6711720354483046}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5480398914865722, "3": 0.23663516786518557, "5": 0.19696179560308377, "2": 0.016089903749551417, "1": 0.0022630570562237134}, "score": 3.9213568481494394}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8566251790998751, "4": 0.1386466733994144, "3": 0.004661563369922342, "2": 2.381930908798454e-05, "1": 0}, "score": 4.851952410704719}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5095960428308082, "5": 0.3866331145617241, "3": 0.10133633955731933, "2": 0.001921498362804638, "1": 0.00048591516835957006}, "score": 4.28000361793704}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6088704558948068, "5": 0.27777823485094943, "3": 0.10919235797872348, "2": 0.003654284369094984, "1": 0.0004980256381678641}, "score": 4.159784292389882}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8410882162831064, "4": 0.15240942405655838, "3": 0.006399242212011918, "2": 3.296470876866484e-05, "1": 0}, "score": 4.834681599854442}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8015210211620815, "3": 0.12339594853734903, "5": 0.07317497412563098, "2": 0.001811842854521371, "1": 8.867921724426402e-05}, "score": 3.9458888945488546}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8852414910091515, "4": 0.11415170153330434, "3": 0.0005904871404240356, "2": 1.4465531056497804e-06, "1": 0}, "score": 4.8846612690054645}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7051877214877733, "4": 0.28767816682225505, "3": 0.0070869543538715244, "2": 2.7110674897040383e-05, "1": 0}, "score": 4.698060539567244}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8220878468408823, "4": 0.17475305777922323, "3": 0.003140465316728848, "2": 1.1330198083264531e-05, "1": 0}, "score": 4.818930699211602}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.814456719385616, "4": 0.1839379695909116, "3": 0.0015169841908424565, "2": 3.168351933697055e-06, "1": 0}, "score": 4.813002632559897}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4338581463662745, "4": 0.41523824048945884, "3": 0.1221327879909307, "2": 0.01973882836661357, "1": 0.008996438519673777}, "score": 4.245267107356398}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5070036886366317, "5": 0.46475606613346493, "3": 0.02780917157291467, "2": 0.00012505636528710998, "1": 0}, "score": 4.436830459504127}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5627081887754756, "5": 0.41495931487628984, "3": 0.02207204948696166, "2": 0.00019259904828875936, "1": 3.686588353644549e-05}, "score": 4.392403627063629}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8738379171583971, "4": 0.12376791751674615, "3": 0.0023733685591453136, "2": 9.58040204253882e-06, "1": 0}, "score": 4.871455162353188}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5423132242200133, "5": 0.42567139653821573, "3": 0.031417569636179685, "2": 0.0005350432356684598, "1": 4.7076717488376025e-05}, "score": 4.393048677075368}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"5": 0.766243174069831, "4": 0.22213706005057102, "3": 0.011296066626616698, "2": 0.00020391139432862664, "1": 7.729084840504461e-05}, "score": 4.754339469281499}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9239395237217667, "4": 0.06975162228394188, "3": 0.005989817109252253, "1": 0.0001614703537925806, "2": 0.00015146272543795747}, "score": 4.917167968315432}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9717174287003753, "4": 0.02807456704072895, "3": 0.00019392074757919916, "2": 2.3171119427991156e-06, "1": 0}, "score": 4.971530305142484}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9883379530300027, "4": 0.011540865739063757, "3": 0.00011623988825880284, "2": 7.94770852252884e-07, "1": 0}, "score": 4.98822422134275}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9814529747777698, "4": 0.01808544152494907, "3": 0.00044227278748486357, "2": 6.631331131082233e-06, "1": 0}, "score": 4.981009878119943}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7255160385575813, "3": 0.15437762001296668, "5": 0.11195417983621749, "2": 0.007002276279511009, "1": 0.0010921429539683424}, "score": 3.9402921307290564}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5602076558329762, "4": 0.42270241844666884, "3": 0.01685985376388029, "2": 0.00015600866615220224, "1": 4.1119545084446455e-05}, "score": 4.5429303122594265}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6999445369544783, "4": 0.2441517306571752, "3": 0.04422447544756822, "1": 0.006364022710016501, "2": 0.005309962000333185}, "score": 4.626011369852387}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7404994411258179, "4": 0.2536316909278264, "3": 0.005712512697540973, "2": 9.807775259869555e-05, "1": 3.5799271998564894e-05}, "score": 4.7344998853601945}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6554851831001927, "5": 0.2874898280690593, "3": 0.05445594787672867, "2": 0.0021465952429611814, "1": 0.00041762974311406533}, "score": 4.227488896056297}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8267648048442099, "3": 0.11863923847037199, "5": 0.05156990567439299, "2": 0.0026552074280877438, "1": 0.0003151877704711241}, "score": 3.926670607829533}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6966746802544239, "5": 0.27210975038649066, "3": 0.03097588129672522, "2": 0.00018495814531924816, "1": 3.556555303218263e-05}, "score": 4.240661868271677}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.695322209541898, "5": 0.2728202569739614, "3": 0.031581477036023896, "2": 0.00019248121373225871, "1": 0}, "score": 4.240873948607185}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8269260893166059, "5": 0.1403544458214683, "3": 0.0324555960252134, "2": 0.0002377096706879923, "1": 2.091846073724831e-05}, "score": 4.107361237721273}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5448350994058079, "5": 0.4461477963081834, "3": 0.008963223061433365, "2": 3.8313394387701164e-05, "1": 0}, "score": 4.437114751386196}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7765072264480974, "3": 0.11306429949746781, "5": 0.1086835315513768, "2": 0.001677859508514184, "1": 4.84866526979504e-05}, "score": 3.9921179065006815}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6779996549263885, "5": 0.2290826553862404, "3": 0.09176357927514178, "2": 0.0010782642571862207, "1": 3.951378340353815e-05}, "score": 4.135048912893809}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.631176544696947, "5": 0.24416220499109323, "3": 0.12261425375037345, "2": 0.0019566344480872982, "1": 6.67381369549473e-05}, "score": 4.117437242268338}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5356982193871699, "5": 0.445444713348579, "3": 0.01875404530943187, "2": 5.774186986681696e-05, "1": 0}, "score": 4.426594500534637}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7953643002334545, "5": 0.12309488478324199, "3": 0.080504032712896, "2": 0.0009905250518701268, "1": 3.807647197684708e-05}, "score": 4.040495903837401}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6025704445723241, "2": 0.35319523545326004, "3": 0.03983474331005462, "4": 0.0034098976595474326, "5": 0.0009776566726717203}, "score": 1.4470104158503887}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6413984360910917, "2": 0.2367588420474616, "3": 0.09414491828535242, "4": 0.019671163447658235, "5": 0.008007153094435933}, "score": 1.5161008386134747}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"1": 0.9623617841643475, "2": 0.035870114333581324, "3": 0.0016803255912989374, "4": 5.8466594559437964e-05, "5": 2.8882404185042588e-05}, "score": 1.0395217117888915}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.980479627721639, "2": 0.016807711164387836, "3": 0.0022311398067196616, "5": 0.000333158568380285, "4": 0.00014567113164228848}, "score": 1.0230397004600993}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.7006617313375358, "2": 0.25709325499549535, "3": 0.038363798939269673, "4": 0.003055035702034071, "5": 0.0008226155490703112}, "score": 1.346277656128741}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5901846057033102, "3": 0.3126708309904291, "5": 0.0714908006355326, "2": 0.022969914144758016, "1": 0.0026728873135745176}, "score": 3.704858244303393}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.982660614776411, "4": 0.01720974131428122, "3": 0.00012548893131189036, "2": 2.05914974192195e-07, "1": 0}, "score": 4.98253859412198}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9633480421427881, "4": 0.03631850093198234, "3": 0.00028461390939889486, "2": 3.1704154971567147e-07, "1": 0}, "score": 4.9631095299785715}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9860752764595441, "4": 0.013785824843347208, "3": 0.00013736746453409208, "2": 3.398848340834035e-07, "1": 0}, "score": 4.985938403820833}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9447168084475278, "4": 0.054517703238204616, "3": 0.0007580759344232025, "2": 1.9894208335596627e-06, "1": 0}, "score": 4.943959872727135}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7429526755756308, "5": 0.1585970294151483, "3": 0.09717575818600394, "2": 0.0011405211179670396, "1": 7.56850429701517e-05}, "score": 4.05891661050921}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6337084236099803, "5": 0.3049417512871513, "3": 0.06114314649940178, "2": 0.00019282625647960134, "1": 7.706472482909163e-06}, "score": 4.243391328709903}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6895394279430528, "5": 0.29849783473347313, "3": 0.011945107484034708, "2": 1.0132231273896834e-05, "1": 0}, "score": 4.286534611111132}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6808697390886863, "5": 0.26576925741044566, "3": 0.0530423514799881, "2": 0.0002200424666527675, "1": 0}, "score": 4.212307756570386}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7414904846912306, "5": 0.19216580728794266, "3": 0.0654105642950938, "2": 0.0008206977211889527, "1": 0}, "score": 4.125127917684871}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5162689388273148, "5": 0.37462526349082936, "3": 0.10731431792396486, "2": 0.001682724622762207, "1": 9.532752159128391e-05}, "score": 4.263663054122161}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8778395911896503, "4": 0.11704649850691645, "3": 0.005090278677084798, "2": 1.635303583296215e-05, "1": 0}, "score": 4.87272295863395}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8536560654309254, "4": 0.13351579413664844, "3": 0.012613125511037094, "2": 0.0001344704615191108, "1": 0}, "score": 4.840841724139357}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5812540060356368, "5": 0.3326382552653422, "3": 0.08461193048765198, "2": 0.0014090127459640716, "1": 7.59592154907047e-05}, "score": 4.24498307633713}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6617192014654527, "4": 0.300931053081892, "3": 0.036930651824597746, "2": 0.00036934994607103585, "1": 3.346190267018591e-05}, "score": 4.62395962321359}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6439298418751248, "4": 0.3507843611528298, "3": 0.005212271133830324, "2": 2.1272380857798507e-05, "1": 0}, "score": 4.638708400701758}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.949763607084427, "4": 0.049659523211767954, "3": 0.0005574786228660849, "2": 1.262596806904907e-06, "1": 0}, "score": 4.949220811202361}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7341248789717613, "4": 0.2571835620036322, "3": 0.008630977609010831, "2": 2.817553527481746e-05, "1": 0}, "score": 4.725461059496472}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9932817222172967, "4": 0.006706480374275527, "3": 9.451784483998656e-06, "1": 0, "2": 0}, "score": 4.993274600281498}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9255038380273833, "4": 0.07398092420668065, "3": 0.0004976263817292859, "2": 8.237934548892221e-07, "1": 0}, "score": 4.925020092917502}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5177828153651478, "5": 0.4632742813369046, "3": 0.018794094139781406, "2": 0.00011677004319050453, "1": 1.6300251839415847e-05}, "score": 4.444204737632795}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9336757815294171, "4": 0.06421238333811362, "3": 0.0020712106243034596, "2": 2.961631991770275e-05, "1": 7.987681623921607e-06}, "score": 4.93152418889539}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5326375526076068, "4": 0.4588593467398931, "3": 0.008394848794421582, "2": 1.559216520994981e-05, "1": 0}, "score": 4.524260097262361}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9344787516614249, "4": 0.06504575718860892, "3": 0.0004537909175645803, "2": 1.9636550498313224e-06, "1": 0}, "score": 4.934039468175973}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5622476881129929, "5": 0.4207283260054093, "3": 0.01692602839735327, "2": 8.407233489315416e-05, "1": 7.478517356474655e-06}, "score": 4.403614303194509}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6521221421594733, "4": 0.2944001743223629, "3": 0.05216850075736135, "2": 0.0011013682593604395, "1": 0.00014532789844547093}, "score": 4.5973522477008055}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5313467806469429, "5": 0.3673560271299809, "3": 0.0972895398188825, "2": 0.003689967605372796, "1": 0.0003019744943351118}, "score": 4.261784741335345}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8128167943754605, "4": 0.17343737426503553, "3": 0.013512048636215865, "2": 0.00018474039290541488, "1": 0}, "score": 4.798974448522306}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8028051877584929, "4": 0.18633541925260455, "3": 0.010713121290077092, "2": 0.00012616070842943436, "1": 1.699160770860588e-05}, "score": 4.791791240128317}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5093866113288477, "5": 0.44276540899495603, "3": 0.04658736089816749, "2": 0.0010834022044400738, "1": 0.0001626039611225497}, "score": 4.3935291822939755}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7116159707535459, "3": 0.14265285321720683, "5": 0.14078451781561668, "2": 0.004556675401414937, "1": 0.00037398831662809555}, "score": 3.9878961552508048}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7828318006905797, "3": 0.134222850091569, "5": 0.0792182957417065, "2": 0.003524574708738374, "1": 0.00019856381963776206}, "score": 3.937350359503678}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7542244773230666, "3": 0.16803427542521882, "5": 0.06661313491069291, "2": 0.010616131447618672, "1": 0.0005041901899821472}, "score": 3.875833058672476}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8701908792166729, "5": 0.08116390908636818, "3": 0.04837006250120262, "2": 0.0002414328928219844, "1": 0}, "score": 4.03231207024307}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6332217134178323, "5": 0.32020780606508054, "3": 0.045655006798661586, "2": 0.0007973012266117723, "1": 0.00011429171208328289}, "score": 4.272616379641066}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7596606565151076, "4": 0.23421328603193767, "3": 0.006103481090497744, "2": 1.5366419213536726e-05, "1": 0}, "score": 4.753531875508237}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6763679136692586, "4": 0.3132399088783093, "3": 0.010322740519158146, "2": 4.8325484840869115e-05, "1": 0}, "score": 4.665962581615118}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6772549764627511, "4": 0.31583230077910385, "3": 0.0068918549960264265, "2": 1.5152257912274431e-05, "1": 3.4710271470908953e-06}, "score": 4.670323908396093}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6633954573636103, "4": 0.32428153672201504, "3": 0.012262824397577471, "2": 4.4367404101424656e-05, "1": 9.853833408132245e-06}, "score": 4.651018216908}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5271662053457136, "4": 0.4571005456151984, "3": 0.015608817500730371, "2": 9.986582728979412e-05, "1": 1.4526892080385994e-05}, "score": 4.5113192085551415}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5778299024726453, "4": 0.41546716212498946, "3": 0.006674893699441063, "2": 2.4024269725766833e-05, "1": 2.1622504578776534e-06}, "score": 4.571101532980086}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6907909040956853, "4": 0.2925037476247489, "3": 0.01651408872974404, "2": 0.00011401494747081156, "1": 3.924231221712251e-05}, "score": 4.673956670431276}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8206677096573953, "4": 0.1704171711507189, "3": 0.008842773563633995, "2": 4.274428738207756e-05, "1": 0}, "score": 4.811763476806381}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.66176425284222, "4": 0.3204309405314971, "3": 0.01762754753034527, "2": 0.00012775706846002204, "1": 3.750786176102856e-05}, "score": 4.643776389150367}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9150055300082642, "4": 0.08229789078494534, "3": 0.0026700571561535996, "2": 1.8292361310233885e-05, "1": 5.510506584030974e-06}, "score": 4.912284837278923}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5381021322183517, "4": 0.38966327898882275, "2": 0.06179425994383087, "5": 0.008129950044737731, "1": 0.0022741709740558705}, "score": 3.339592873107442}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8053067808000154, "4": 0.19145597353590352, "3": 0.0032061594216556237, "2": 3.4405404202769235e-06, "1": 0}, "score": 4.802115915355089}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7444737768326695, "4": 0.25225785007868423, "3": 0.003150445208814558, "2": 3.9072256040828065e-06, "1": 0}, "score": 4.74140005209163}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9580883058144468, "4": 0.04128299942331293, "3": 0.0005921908460189049, "2": 7.775779038769675e-07, "1": 0}, "score": 4.957528768809363}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9382756586426356, "4": 0.061041458385464105, "3": 0.0006564917703129473, "2": 6.174763924656215e-07, "1": 0}, "score": 4.937642098449315}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6830163644739908, "4": 0.3026314955291585, "3": 0.014142279813552996, "2": 0.00013745100934757843, "1": 0}, "score": 4.66864759886204}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9514569382214522, "4": 0.047658084454963764, "3": 0.0008531623502811128, "2": 9.615453636050694e-06, "1": 0}, "score": 4.950605647952677}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9878999683197356, "4": 0.011871692430822216, "3": 0.00022213083563125117, "2": 1.9404046968900933e-06, "1": 0}, "score": 4.98767817209415}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9917112348247386, "4": 0.00819576517653457, "3": 8.507783624166572e-05, "2": 7.862445190167006e-07, "1": 0}, "score": 4.991631660701642}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6370782815418061, "4": 0.3380800761066817, "3": 0.024011713624811793, "2": 0.000577204750990016, "1": 0.00020368273404659646}, "score": 4.611331090648626}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6416144313052774, "5": 0.24395519441441635, "3": 0.11263771191875514, "2": 0.0014479268561543958, "1": 0}, "score": 4.128465915545674}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5505176288443422, "5": 0.3204850979366188, "3": 0.12596230291615523, "2": 0.002069655729060851, "1": 0}, "score": 4.190567441090523}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5398999685550888, "3": 0.2292359171111708, "5": 0.2215745006497646, "2": 0.007071172296630906, "1": 0}, "score": 3.978147761034004}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6054033190507399, "5": 0.2759753027661903, "3": 0.11608488363547977, "2": 0.00214753308057213, "1": 0.0002704181752210997}, "score": 4.154802449235814}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6176922765006175, "3": 0.20489734118102007, "5": 0.17174104310689728, "2": 0.005057363393319861, "1": 0.00040398088317356994}, "score": 3.955507778332964}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.785860486813703, "4": 0.15920172025633336, "3": 0.045381915059636554, "1": 0.006040400266155978, "2": 0.00351152697672902}, "score": 4.715337143032689}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7586194581327058, "4": 0.21750735781306516, "3": 0.02264220808832246, "2": 0.0006209804239236835, "1": 0.000578879163957415}, "score": 4.733021460677534}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8236076050162664, "4": 0.15710674503229385, "3": 0.018552196263182406, "2": 0.0003951027501216629, "1": 0.00032977828267230264}, "score": 4.803282754671119}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9740540763638734, "4": 0.025571119726609155, "3": 0.0003666762690025697, "2": 8.771586150334994e-07, "1": 0}, "score": 4.973692705518977}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9328855075252708, "4": 0.06014021057587296, "3": 0.006685158225315186, "2": 0.00014609316840796, "1": 8.784409170033157e-05}, "score": 4.925695716514563}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5608820753066307, "4": 0.3015280898971381, "2": 0.09930338697531033, "5": 0.024801592851268314, "1": 0.013484134592705322}, "score": 3.224859781422757}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5320288828727554, "3": 0.3839874343410515, "5": 0.060424193476204854, "2": 0.021822003136895925, "1": 0.001735968687605943}, "score": 3.6275842816630957}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7071048227014464, "5": 0.19578747877220284, "3": 0.0954606937489436, "2": 0.001542701775566003, "1": 0.00010122659896738991}, "score": 4.096937999895567}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5266878926191141, "4": 0.4391050327359328, "5": 0.017783112641801924, "2": 0.015930161770930054, "1": 0.0004922108383669324}, "score": 3.4577574021286743}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5405942616370264, "4": 0.315340270300987, "2": 0.12507390204742325, "5": 0.013780289567647876, "1": 0.00521045549486997}, "score": 3.207406206669669}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4340747780800532, "4": 0.2871380409316058, "2": 0.2109354956635288, "1": 0.04291221764518961, "5": 0.024930036932492856}, "score": 3.040238563322399}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.559592633580863, "5": 0.24082474721538985, "3": 0.18374453184475295, "2": 0.014135597751208824, "1": 0.001679481775696458}, "score": 4.023771121463101}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6405036237320963, "5": 0.17924888856425225, "3": 0.1740278387063193, "2": 0.0057553570329061925, "1": 0.00045406749662190555}, "score": 3.99234805506519}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5525473985716297, "4": 0.3962307640314642, "3": 0.048692970608480414, "2": 0.0019495435709182848, "1": 0.0005186607756291681}, "score": 4.498429594450729}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5944723937560807, "5": 0.315877310088802, "3": 0.08574909044909339, "2": 0.003574190721751899, "1": 0.00031725363296786294}, "score": 4.222030244612519}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.619519748681838, "5": 0.34032069000978055, "3": 0.03990955939289901, "2": 0.00021056292887361086, "1": 0}, "score": 4.3000018365275485}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5190686141637857, "4": 0.4480492587699508, "3": 0.03267185418518553, "2": 0.00018938207929187584, "1": 0}, "score": 4.486028149337748}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7412973293377286, "4": 0.24383456400961726, "3": 0.01471232795885325, "2": 0.00011100203760706711, "1": 0}, "score": 4.726395522866249}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.785778187954574, "4": 0.21250018925633818, "3": 0.001716903330585105, "2": 2.4964396029204417e-06, "1": 0}, "score": 4.784058034720613}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7503515116867506, "5": 0.2079117017974771, "3": 0.04150825316798885, "2": 0.00019896990019132433, "1": 0}, "score": 4.166010416669359}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9864536400478169, "4": 0.013466448275237188, "3": 7.793140821630239e-05, "2": 2.44660329148082e-07, "1": 0}, "score": 4.986376931283031}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9712048780360588, "4": 0.02851860778557775, "3": 0.0002736496279386931, "2": 7.796763026502021e-07, "1": 0}, "score": 4.970931693325875}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9471870015237795, "4": 0.052250171805452036, "3": 0.0005481481285334327, "2": 2.9386037628931226e-06, "1": 0}, "score": 4.94664408973109}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.969926325948178, "4": 0.02992587464685948, "3": 0.0001363057546068583, "2": 3.9603232509326537e-07, "1": 0}, "score": 4.9697999905987835}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7945232974693378, "4": 0.2044353275939699, "3": 0.0010172914752291369, "2": 3.086724690292689e-06, "1": 0}, "score": 4.793516493801674}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.49328066831804745, "4": 0.4316740238473653, "5": 0.03800885956434595, "2": 0.03498655969350386, "1": 0.002046640726336372}, "score": 3.468613423816177}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7402096367487967, "4": 0.1703130099376049, "2": 0.076716612764558, "5": 0.00894724155809485, "1": 0.0038098327059768195}, "score": 3.1038715957001526}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.729929956093572, "3": 0.1847890822968508, "5": 0.08353820557281333, "2": 0.0016291018960978058, "1": 0}, "score": 3.8954790402439046}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6515946974664427, "4": 0.31036064088052645, "2": 0.026235757726105435, "5": 0.011390423733229212, "1": 0.00040448819745507816}, "score": 3.3061010371905306}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5726965234823498, "3": 0.34396007135087764, "5": 0.06954889837933678, "2": 0.012854704830276186, "1": 0.0009307353363460666}, "score": 3.6970844649385732}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8326286121422369, "2": 0.1422591620450849, "3": 0.022718981828949887, "4": 0.0019063758502204221, "5": 0.000485035923838363}, "score": 1.1953567548835347}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9836001058748076, "2": 0.015539253072973578, "3": 0.0007994192751150056, "4": 3.658497210864128e-05, "5": 2.3405582398828444e-05}, "score": 1.0173414902203595}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.39124942765166026, "1": 0.2993731471190605, "3": 0.28246396332044604, "4": 0.02397038185798577, "5": 0.002857290445193071}, "score": 2.0396068491089023}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9905138689231129, "2": 0.009114212232355055, "3": 0.0003474903371877486, "4": 1.2549283319914473e-05, "5": 1.08016679061872e-05}, "score": 1.0098900580854073}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9354324436865846, "2": 0.05617837964082117, "3": 0.007452848281438737, "4": 0.0006143418658452534, "5": 0.0003057847912529262}, "score": 1.074151442348195}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"4": 0.528905712632257, "5": 0.45396153917632365, "3": 0.01695281300378446, "2": 0.0001292567269364627, "1": 0}, "score": 4.436772347668922}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9661438382252064, "4": 0.03248369525479659, "3": 0.001358667281177837, "2": 9.05699654540239e-06, "1": 2.6039969627429154e-06}, "score": 4.964761307856393}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5274809647842934, "4": 0.4333812167989753, "3": 0.03862400904060549, "2": 0.00045148491342797555, "1": 5.702972128342704e-05}, "score": 4.48778547945096}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5200758565838324, "5": 0.45997842167566727, "3": 0.019826709215894734, "2": 0.00010096082375330222, "1": 1.1176893400550402e-05}, "score": 4.43991928449244}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.683640318372475, "4": 0.29014699648299824, "3": 0.02587055835265262, "2": 0.00028467140721567737, "1": 4.825071073638485e-05}, "score": 4.6570617131119985}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6160803842807236, "3": 0.32281763910879047, "5": 0.0550202488827466, "2": 0.0059194484598043134, "1": 0.00015488370700981124}, "score": 3.719896990214444}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7897426232165818, "3": 0.11770222039800567, "5": 0.09153658962701215, "2": 0.0008805331338630755, "1": 0}, "score": 3.972069447605898}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6265462841753203, "5": 0.24247278541380934, "3": 0.1291393790684548, "2": 0.0016366442867840616, "1": 0.00017430115133169798}, "score": 4.109540566905898}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6957158385230428, "5": 0.28437769852592826, "3": 0.01979573041777948, "2": 6.606886175072322e-05, "1": 0}, "score": 4.26446164221256}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6003948841471828, "5": 0.33639682133217474, "3": 0.06240544798287234, "2": 0.0006818385897860366, "1": 0.00010768492023427381}, "score": 4.272308269379657}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7126561307270541, "4": 0.27543131274614163, "3": 0.01176270906936389, "2": 0.00010499193712929563, "1": 4.1381816027916235e-05}, "score": 4.7005617258796155}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9474654803855439, "4": 0.052402483171964755, "3": 0.00013186379818694665, "2": 8.926610360621745e-08, "1": 0}, "score": 4.9473335170421135}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8346745087559615, "4": 0.16361650067955952, "3": 0.001697029855125507, "2": 3.1165934362444116e-06, "1": 0}, "score": 4.83297861267337}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5077270393135263, "5": 0.483887324494005, "3": 0.008375308216316026, "2": 8.419913524602594e-06, "1": 0}, "score": 4.475496083726947}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6899511230908806, "4": 0.3082699249799788, "3": 0.0017768868616735065, "2": 1.7859554854155547e-06, "1": 2.0489872587461043e-07}, "score": 4.6881701006934025}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6610971669562963, "3": 0.31845149740788903, "5": 0.015849020162030495, "2": 0.0045236436166126584, "1": 7.4717740803499e-05}, "score": 3.6881248491078673}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8468422561383804, "3": 0.09848300340079014, "5": 0.05448029512663451, "2": 0.00018760516308421473, "1": 4.048415451281119e-06}, "score": 3.9556098122267636}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8654832824801184, "5": 0.12040635079882141, "3": 0.014100401596251028, "2": 5.946575799205079e-06, "1": 0}, "score": 4.1062944832005615}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9068256758149537, "4": 0.09275654629363124, "3": 0.0004144592083220316, "2": 4.090100946141477e-07, "1": 0}, "score": 4.906413035951979}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7501418177453276, "5": 0.22906588714959109, "3": 0.02075943991696453, "2": 2.517145357969598e-05, "1": 0}, "score": 4.208257704522385}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7044921784331958, "4": 0.22149403940377538, "2": 0.07026211009015461, "5": 0.002522764386324706, "1": 0.0012258770892014427}, "score": 3.1538261700930508}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.707916507147649, "5": 0.2395671561439945, "3": 0.05168389782714687, "2": 0.0007356006364664855, "1": 7.612034372340111e-05}, "score": 4.186187553428047}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5810488189085669, "5": 0.37138144162927983, "3": 0.04713486586029807, "2": 0.00034320916025052495, "1": 6.048361839034039e-05}, "score": 4.323388790122004}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5278769350497302, "4": 0.4627767141848918, "3": 0.009289997455993215, "2": 3.03205760002751e-05, "1": 0}, "score": 4.51853979544998}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.709991216606541, "3": 0.17519297470492545, "5": 0.10348607669623777, "2": 0.009235153905613611, "1": 0.0020796728110958266}, "score": 3.903582338614984}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7638579396283269, "3": 0.1890176277033531, "5": 0.041684330007363234, "2": 0.005121335674636358, "1": 0.0003172913883965895}, "score": 3.8414719228658467}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5800627451498508, "4": 0.39738181891462654, "3": 0.022371503392365842, "2": 0.0001406559106631367, "1": 3.3693554500886014e-05}, "score": 4.557314190058006}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7077752352691421, "5": 0.1804266418792647, "3": 0.11090816083525527, "2": 0.0007644881752604469, "1": 0.00010160945155809958}, "score": 4.067686291630842}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5972838009920333, "5": 0.36196147336089074, "3": 0.04057363530641911, "2": 0.00014740318066232863, "1": 2.7262102691120897e-05}, "score": 4.321013307913972}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5379719272577905, "5": 0.4120103123376921, "3": 0.0494775325660586, "2": 0.0004505431513691104, "1": 8.160859260550322e-05}, "score": 4.361389786309139}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6674927167521463, "3": 0.19834056511592457, "5": 0.12719267706208168, "2": 0.006198447013502596, "1": 0.0007642517556320194}, "score": 3.9141614890460517}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.702401009111573, "4": 0.1989354258764665, "2": 0.08868818503038321, "5": 0.006795778964866566, "1": 0.0031705582579153245}, "score": 3.1174987447727935}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6517222335443197, "3": 0.20627626838716878, "5": 0.1373718769877401, "2": 0.004186192790495011, "1": 0.0003426459019073579}, "score": 3.921687392782265}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.591648837498568, "3": 0.22911078846365748, "5": 0.17041468307818305, "2": 0.008377828725749943, "1": 0.0004219268922710886}, "score": 3.9232804667389125}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5466963770754875, "3": 0.2517859392188411, "5": 0.19476037932811838, "2": 0.006293761967560648, "1": 0.0004130304247669452}, "score": 3.9291442458350474}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8258734214505337, "3": 0.13951747733677758, "5": 0.03134110450544299, "2": 0.0031406798178351117, "1": 0.0001186920777929664}, "score": 3.8851852010436043}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7876908251387638, "5": 0.18280568881758702, "3": 0.02931540011044154, "2": 9.971334882890658e-05, "1": 0}, "score": 4.153304409916389}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8978906398501681, "5": 0.06400942121320144, "3": 0.03775746026114994, "2": 0.000312534404639941, "1": 1.620110675256403e-05}, "score": 4.025578640353966}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.819531552011553, "5": 0.16891293066288807, "3": 0.01148327557450041, "2": 5.043551340355088e-05, "1": 0}, "score": 4.1573322148852485}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5299226375377931, "5": 0.46272717196191376, "3": 0.007258529636971776, "2": 5.050233424893556e-05, "1": 0}, "score": 4.455386380690031}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5145263758538391, "4": 0.40541692376174027, "3": 0.0754312827068512, "2": 0.0038248424580108794, "1": 0.0007904187418159968}, "score": 4.429078509931855}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4336561239842186, "4": 0.29074784484785027, "2": 0.16128875679002708, "5": 0.09193217519125174, "1": 0.022371666704936698}, "score": 3.2685810269299176}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6056266329713615, "3": 0.2422165786398335, "5": 0.13954129500293894, "2": 0.011142950758269383, "1": 0.0014676350254010139}, "score": 3.8706352748997546}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5160718185237981, "5": 0.3417890995909782, "3": 0.1374624761289632, "2": 0.0042020843625491505, "1": 0.0004621594021923892}, "score": 4.194538381412162}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5536762219489115, "3": 0.3193766345731516, "5": 0.11037319207871003, "2": 0.015228166602264948, "1": 0.0013304346308765445}, "score": 3.756545183336529}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5617259620615258, "5": 0.40496197709459475, "3": 0.03298513412741909, "2": 0.00028140658857524317, "1": 4.0909346509819045e-05}, "score": 4.371293013701409}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6421244157915408, "5": 0.3307833002589642, "3": 0.026900583531198903, "2": 0.00014973731985194405, "1": 0}, "score": 4.303595981916137}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6636756883379271, "5": 0.2549782325541613, "3": 0.07855706308426512, "2": 0.002264613895819218, "1": 0.00042806264768422054}, "score": 4.170624191581122}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5490795984023091, "4": 0.43501602912897, "3": 0.01563011151339479, "2": 0.00015573137346009923, "1": 0}, "score": 4.533201224260156}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5712167580867256, "5": 0.33986948592275734, "3": 0.08457149564957506, "2": 0.003485479690182496, "1": 0.000839135804395816}, "score": 4.245813960829202}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9384150489063371, "4": 0.06067186484414429, "3": 0.0009096041982939103, "2": 2.096358009567107e-06, "1": 0}, "score": 4.937502551082948}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.894398136592258, "4": 0.10180887478815338, "3": 0.0037768875802191956, "2": 1.2016642427889923e-05, "1": 2.6313514090548527e-06}, "score": 4.890590615741671}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9248076676077956, "4": 0.07437670433130542, "3": 0.0008063382003940488, "2": 1.164782713918514e-06, "1": 0}, "score": 4.924006507466727}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979046340506671, "4": 0.0020812689482764303, "3": 1.313819396421588e-05, "1": 0, "2": 0}, "score": 4.997892452643064}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8603051130833587, "4": 0.1320695369536746, "3": 0.007593634108423083, "2": 2.4134287758948217e-05, "1": 0}, "score": 4.852669674971504}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7486947813886415, "5": 0.14905364563737722, "3": 0.1009498116500169, "2": 0.0011836528340510557, "1": 0}, "score": 4.045741930829634}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8118517576157593, "4": 0.18606088874408186, "3": 0.0020650073360683075, "2": 3.226224467279748e-06, "1": 0}, "score": 4.809795781190572}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.925253837682069, "4": 0.07406283681129296, "3": 0.0006706474291460648, "2": 1.0251557558411404e-06, "1": 0}, "score": 4.924591914138624}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.936627421457553, "4": 0.06290447330990262, "3": 0.00046416614440099064, "2": 1.0500823167111027e-06, "1": 0}, "score": 4.936163859731363}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.636567358620661, "4": 0.3545559207621881, "3": 0.008849223180761454, "2": 1.807264660601512e-05, "1": 0}, "score": 4.627687905973251}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"2": 0.38509529339866827, "3": 0.3633956475915565, "4": 0.12658034931507747, "1": 0.11318099681095456, "5": 0.011729869989116008}, "score": 2.538574569107391}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6660975817703061, "3": 0.21289757446172455, "5": 0.11397498323229922, "2": 0.005927383466642013, "1": 0.0010977677271836505}, "score": 3.885928801455471}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6196846496101454, "4": 0.355031912209151, "3": 0.0251012985279824, "2": 0.00015046636306269802, "1": 0}, "score": 4.594301241831414}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6628117935901484, "4": 0.3154590813574669, "3": 0.021560406042038776, "2": 0.0001367899527887071, "1": 2.1363749946242326e-05}, "score": 4.640920487914803}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7152070055061598, "5": 0.1769363527604357, "3": 0.10575273484200834, "2": 0.001957668606930373, "1": 0.00013966162852140272}, "score": 4.066849735466712}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8279954332588082, "4": 0.16790589589499827, "3": 0.004033539502627587, "2": 2.6764531459194276e-05, "1": 0}, "score": 4.823939976643533}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.913667051637878, "4": 0.08198462084323259, "3": 0.004269934890433052, "2": 4.2630227098593345e-05, "1": 1.8094998207664445e-05}, "score": 4.9092736358025215}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9504957266126038, "4": 0.047268082492439314, "3": 0.002185260140684189, "2": 2.601148205310377e-05, "1": 1.544125089706542e-05}, "score": 4.948221107014993}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9188551647239956, "4": 0.07919694136787346, "3": 0.0019198248904352337, "2": 1.0554544843002428e-05, "1": 0}, "score": 4.916930290294552}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9790537646824118, "4": 0.0204401944598622, "3": 0.0004849794689425671, "2": 3.64299650249526e-06, "1": 0}, "score": 4.97857854448543}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6203408710544223, "4": 0.35253985475014077, "3": 0.02679853385137653, "2": 0.00020902159206916384, "1": 0}, "score": 4.593190564528469}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9219825517074521, "4": 0.07621169121805141, "3": 0.0017604648244508349, "2": 4.939136695659791e-06, "1": 0}, "score": 4.92024934353568}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9086176821248518, "4": 0.0906443111459858, "3": 0.0006435475763108867, "2": 1.6124109735535035e-06, "1": 0}, "score": 4.908055219695188}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9157566642329814, "4": 0.08349227219258575, "3": 0.000734097282989006, "2": 1.391152524588576e-06, "1": 0}, "score": 4.915034036427176}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9830637769806099, "4": 0.016700405139556673, "3": 0.000189004260656999, "2": 2.4505577481608196e-07, "1": 0}, "score": 4.98292005578334}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6794248347357834, "5": 0.2170984156312334, "3": 0.10259619835521804, "2": 0.0008046597827525877, "1": 6.6429587888632e-05}, "score": 4.112694675253395}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6384461278836453, "3": 0.21211642086860155, "5": 0.14659284455966892, "2": 0.0026861092710692173, "1": 0.00014564229161348024}, "score": 3.9286663612712167}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6486567777566324, "3": 0.2964470084873799, "5": 0.043993882008188885, "2": 0.01009814333753688, "1": 0.0007903157569635468}, "score": 3.724975824259806}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5460445571855093, "5": 0.41885700255296965, "3": 0.03497410669501822, "2": 6.67864728615895e-05, "1": 0}, "score": 4.3837714078413725}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6561570586633492, "3": 0.30447393342867207, "5": 0.0379677638127691, "2": 0.0013560191054476866, "1": 3.243809675941484e-05}, "score": 3.7306810341301224}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6017760577346077, "5": 0.3047291895222508, "3": 0.09206206590417537, "2": 0.001333198415533657, "1": 5.792746114916882e-05}, "score": 4.209835665375734}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9143508948395759, "4": 0.0812948508184967, "3": 0.004280717257075972, "2": 5.047628176658156e-05, "1": 1.1891472635129263e-05}, "score": 4.909943714063095}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.555780770582916, "5": 0.2621449457871794, "3": 0.17934655203008337, "2": 0.002609992320471365, "1": 0.0001033656351268494}, "score": 4.077269422853967}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6683517314061298, "4": 0.3206602909097608, "3": 0.010907622742422808, "2": 5.340153858286457e-05, "1": 0}, "score": 4.657355023541473}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9082534893949629, "4": 0.0877693612454511, "3": 0.003913638402276563, "2": 3.497356736285266e-05, "1": 0}, "score": 4.9042957100972675}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7901324099768624, "5": 0.18183914525178743, "3": 0.027892428692829523, "2": 5.114667871156773e-05, "1": 0}, "score": 4.153857480993603}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8217854234787535, "5": 0.1270370503538832, "3": 0.051029294969606676, "2": 0.00010305394180258312, "1": 0}, "score": 4.075805072165819}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5314981829109776, "5": 0.456986101967519, "3": 0.011436629049014527, "2": 1.563563427876195e-05, "1": 0}, "score": 4.445546471768824}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6127926100171266, "4": 0.37876682526625843, "3": 0.00803075928061325, "2": 8.700578850298418e-06, "1": 0}, "score": 4.60498711284829}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7564199557576793, "5": 0.19843505722859953, "3": 0.04494580717256019, "2": 6.910192288562799e-05, "1": 0}, "score": 4.153370996390202}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9447784097706103, "4": 0.05447260849929646, "3": 0.0007121193743513063, "2": 7.254177849249414e-06, "1": 0}, "score": 4.944079734521285}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.969758575209447, "4": 0.030028990918470735, "3": 0.00018319122597879603, "1": 0, "2": 0}, "score": 4.969603737762432}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9250274280161219, "4": 0.07428237272661932, "3": 0.0006559541924766524, "2": 1.8578846544304467e-06, "1": 0}, "score": 4.9243976966890495}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.985878736733585, "4": 0.013943041672471967, "3": 0.00016959013543614842, "2": 6.966595472264909e-07, "1": 0}, "score": 4.985715574733971}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9910949172255393, "4": 0.0087388690237922, "3": 0.00015562644587895414, "2": 1.8165708181509069e-06, "1": 0}, "score": 4.990944348947289}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8199860098728924, "5": 0.1377199229473086, "3": 0.042083034521466084, "2": 0.00019260039648681608, "1": 1.7728323492848035e-05}, "score": 4.095198569676314}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.856245255879275, "5": 0.10661100885730931, "3": 0.03703273602768965, "2": 0.00010325080805037538, "1": 6.731530672332194e-06}, "score": 4.069351647144985}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5087947425744898, "5": 0.4831821375672602, "3": 0.00800338741537746, "2": 1.3593157728801645e-05, "1": 0}, "score": 4.475154480945272}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.830356701225037, "4": 0.16737288689907673, "3": 0.002256739966028884, "2": 9.593373099443626e-06, "1": 0}, "score": 4.828084151884461}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6215365254047498, "4": 0.37433131677208353, "3": 0.004120342450588593, "2": 4.3122920373187826e-06, "1": 0}, "score": 4.617412190863481}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6133421942529657, "4": 0.34709234865164007, "3": 0.03821379893240348, "2": 0.0009200371576378476, "1": 0.00035791297059984897}, "score": 4.5722567620147885}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7302184083992252, "4": 0.25700046108075136, "3": 0.01265038031289569, "2": 9.84539137487421e-05, "1": 2.944277526601188e-05}, "score": 4.717284838718313}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.904973674188308, "4": 0.09101975573847698, "3": 0.003975129312334781, "2": 1.8083529614728906e-05, "1": 6.582407487403774e-06}, "score": 4.9009487343631895}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.973598366601237, "4": 0.02587139139804353, "3": 0.0005256150275360832, "2": 1.777963410687902e-06, "1": 0}, "score": 4.973071967938425}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8123663911189639, "4": 0.1746208372349675, "3": 0.012829689522306158, "2": 0.00012704362837334424, "1": 3.4726967898030474e-05}, "score": 4.799195465512351}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7195835766888002, "4": 0.2717108580417463, "3": 0.00864625153946045, "2": 1.9038943853857315e-05, "1": 0}, "score": 4.710927879729948}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.895721159819768, "4": 0.1006463894368777, "3": 0.003617587180842115, "2": 6.191432972987136e-06, "1": 0}, "score": 4.892098926170429}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9445395980863711, "4": 0.05399506637595466, "3": 0.0014383761144830865, "2": 3.105412503605689e-06, "1": 0}, "score": 4.943117508282004}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903072484826951, "4": 0.009571359740149561, "3": 0.00011861898598763334, "2": 1.6642168475709202e-07, "1": 0}, "score": 4.990190877456623}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9535862460127044, "4": 0.045665316863159194, "3": 0.0007406213958614711, "2": 1.4665277882809126e-06, "1": 0}, "score": 4.952848741388959}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6564798360692581, "2": 0.22509494230055407, "4": 0.1048419081606082, "1": 0.01086247597641975, "5": 0.0027175857084995826}, "score": 2.86345674131494}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.49745996399680875, "2": 0.3978719337403351, "4": 0.08039315043668216, "1": 0.0220631054979264, "5": 0.002209092900441471}, "score": 2.6428122080105787}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5672996112008601, "2": 0.3834443421492846, "4": 0.03648994630623716, "1": 0.01220317274484587, "5": 0.0005591152132797743}, "score": 2.629756077581262}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6415453331520281, "2": 0.223865691157896, "4": 0.11576667915791593, "1": 0.015565209741166664, "5": 0.003245942578409987}, "score": 2.867260974402587}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7033779691129993, "3": 0.22239153041438617, "1": 0.0689691483318989, "4": 0.005156569738050904, "5": 0.00010449336305622795}, "score": 2.16404904906443}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6128652302440771, "4": 0.37281502271511424, "3": 0.014158445185914616, "2": 0.00011251556391247984, "1": 0}, "score": 4.598510953059851}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7964413874286017, "4": 0.1972752336871791, "3": 0.006209196993580508, "2": 3.4853046746579806e-05, "1": 0}, "score": 4.790193561740763}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5875796486398269, "4": 0.3970094639158952, "3": 0.015234830382749132, "2": 0.00014726571763124639, "1": 2.270040028345521e-05}, "score": 4.571985669553427}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9692331569376884, "4": 0.030374841361552524, "3": 0.00038389671995610526, "2": 2.1827783939543566e-06, "1": 0}, "score": 4.9688506323904935}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5838550961338529, "4": 0.40066704832392275, "3": 0.015282498411558324, "2": 0.00015106324013261827, "1": 3.630456743329661e-05}, "score": 4.568166096802252}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5744801695750745, "4": 0.4194017868635112, "3": 0.0060788788480476055, "2": 2.572647347357815e-05, "1": 0}, "score": 4.568357475504182}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6186648318921911, "4": 0.37406870321584834, "3": 0.007227372682014611, "2": 3.4454532557529955e-05, "1": 0}, "score": 4.611371385488312}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8725427927294707, "4": 0.1266209374810032, "3": 0.0008226966629622989, "2": 2.0751149670691493e-06, "1": 0}, "score": 4.871725968951874}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9876517501253778, "4": 0.012323392420182343, "3": 1.649926043802749e-05, "1": 0, "2": 0}, "score": 4.987643505780967}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9680231032466802, "4": 0.03180785522647109, "3": 0.00016278227276086865, "2": 3.999501190457674e-07, "1": 0}, "score": 4.967865192090043}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8397565420892379, "3": 0.11124069520949773, "1": 0.046034677859352696, "4": 0.0029338647435505276, "5": 3.3801377563136596e-05}, "score": 2.0711751807724643}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6281794530935298, "2": 0.3137668452304088, "4": 0.04787328282546497, "1": 0.00935655136776044, "5": 0.0008214865443402292}, "score": 2.7170356342274644}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8158905442204032, "3": 0.12230687789153771, "1": 0.058700267211700866, "4": 0.003049700164245505, "5": 5.12151075554938e-05}, "score": 2.0698597538136134}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6736645447861519, "4": 0.1549202361502489, "2": 0.154519480996632, "1": 0.009259039142655485, "5": 0.0076302932546578285}, "score": 2.9971432450781927}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8472772043591119, "1": 0.0816283378275886, "3": 0.07017930584091667, "4": 0.0008963641590925528, "5": 1.867146752734006e-05}, "score": 1.9903997096171422}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7167802290086609, "4": 0.27765895471632357, "3": 0.005517629220443844, "2": 1.5054193013869358e-05, "1": 0}, "score": 4.711252500970332}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7688652134011751, "4": 0.22809866554860184, "3": 0.0030288523305719824, "2": 3.023833985889648e-06, "1": 0}, "score": 4.765833564278551}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9039519704812736, "4": 0.09480415894079115, "3": 0.0012046189332742053, "2": 2.9336387830036748e-06, "1": 0}, "score": 4.9027742712317215}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9583202372408292, "4": 0.04126039904137805, "3": 0.0004041231094748073, "2": 1.2725446509272695e-06, "1": 0}, "score": 4.95792694942667}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8868358329775479, "4": 0.11132872140918072, "3": 0.0018280850148537603, "2": 2.531073593441567e-06, "1": 0}, "score": 4.88500695997859}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6075606581168329, "5": 0.320363528953556, "3": 0.0709459755020784, "2": 0.000901266104909202, "1": 0.00013968257933695303}, "score": 4.2472179483964}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5746688598440093, "4": 0.3913791874748592, "3": 0.03349443075804589, "2": 0.0003419966555647236, "1": 0.00010132666026931345}, "score": 4.540194125798258}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5731167103635639, "5": 0.2382662102351316, "3": 0.1831406760263969, "2": 0.005011131705866605, "1": 0.0004599066609723571}, "score": 4.043723785392546}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7251855107223126, "4": 0.2512760106480068, "3": 0.023325642198542166, "2": 0.0001372013504213113, "1": 3.934730788711294e-05}, "score": 4.70149287951352}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5940071337568151, "5": 0.31888437586645285, "3": 0.0860101041081796, "2": 0.0008674150291909553, "1": 0.00021067582085583563}, "score": 4.230512092576713}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.563320185136437, "5": 0.30042137695185733, "3": 0.13197232994476754, "2": 0.003825420052829353, "1": 0.00044642711823856423}, "score": 4.159461199590331}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6454692547251311, "5": 0.17587680511069473, "3": 0.1716349227680222, "2": 0.006510550266433094, "1": 0.000507072787291499}, "score": 3.989699549085576}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6835503093776271, "5": 0.289995956268662, "3": 0.026271294493621783, "2": 0.00015958386093865268, "1": 1.7313474271327233e-05}, "score": 4.263355013282062}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6301850138072674, "5": 0.29737417043166925, "3": 0.0716854844692189, "2": 0.000683313636192177, "1": 5.677221638843814e-05}, "score": 4.224155159384768}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5806794880662977, "5": 0.34702536629235586, "3": 0.07070745260259634, "2": 0.001405588784890795, "1": 0.0001624083037627245}, "score": 4.273024888693274}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7132594070367764, "5": 0.22975678180231301, "3": 0.05667560543893957, "2": 0.0002680449145207412, "1": 3.718533852667901e-05}, "score": 4.17243404359089}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6809199823204349, "5": 0.22731960504394025, "3": 0.09116614207586787, "2": 0.000545331222608223, "1": 4.712664526596096e-05}, "score": 4.1349216651584655}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8298683543401519, "4": 0.16454170748015165, "3": 0.005574655819245136, "2": 8.601912463076093e-06, "1": 3.8271085028078525e-06}, "score": 4.824267365285093}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9046182386733344, "4": 0.093091211281345, "3": 0.0022812099430467975, "2": 4.330965766749655e-06, "1": 2.7171120174810966e-06}, "score": 4.902322283607473}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.530478791526307, "5": 0.4281779708870034, "3": 0.04115436838085202, "2": 0.0001568664110274052, "1": 2.1296602606775813e-05}, "score": 4.38665011942677}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.925839490271813, "4": 0.07301142815630954, "3": 0.001140482340908243, "2": 4.397721465148316e-06, "1": 2.5566825979537005e-06}, "score": 4.924684063385408}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8382211928902092, "4": 0.15498672668810565, "3": 0.0066845839948871805, "2": 7.342728214904927e-05, "1": 3.2855447409768864e-05}, "score": 4.8312921969258396}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9644395630793728, "4": 0.034244007263218156, "3": 0.001291225514943311, "2": 1.1406867176735788e-05, "1": 0}, "score": 4.963138812521414}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9894730859061859, "4": 0.010149013198939946, "3": 0.00036755668731852724, "2": 3.2794363331023007e-06, "1": 0}, "score": 4.989105958153511}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9741564489822545, "4": 0.02557029379278089, "3": 0.00025636637096567284, "2": 1.8036196420314618e-06, "1": 0}, "score": 4.973911168998054}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7111960847000502, "5": 0.27435582052789925, "3": 0.014408034162971508, "2": 2.4552128668698327e-05, "1": 0}, "score": 4.25990271280372}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9480732820255724, "4": 0.05156509442664176, "3": 0.00035044597511115004, "2": 5.523295267689321e-07, "1": 0}, "score": 4.947731801272235}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5578058032635518, "4": 0.4350116093885664, "3": 0.007121330521637239, "2": 1.311849488710121e-05, "1": 0}, "score": 4.550684744796859}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9461223218577136, "4": 0.05344074548003985, "3": 0.0004045828587682243, "2": 7.664012341270663e-07, "1": 0}, "score": 4.94574607607522}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6893173630587819, "4": 0.29871375657490234, "3": 0.01190441784834462, "2": 4.459142419724059e-05, "1": 0}, "score": 4.677337221793494}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5264237564263975, "4": 0.3946463624597259, "5": 0.039093170295392055, "2": 0.03740356343835557, "1": 0.0024297206186218376}, "score": 3.4305711738396356}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7040758550345071, "3": 0.23289187241900855, "5": 0.06076900537551487, "2": 0.0021447044964183594, "1": 0.00011539748475634905}, "score": 3.8232409720335294}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6042429480802208, "5": 0.27372536302053513, "3": 0.11968763160930578, "2": 0.0021364053612996626, "1": 0.00019722644940852192}, "score": 4.149174796559148}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6102742333311045, "3": 0.346764744049665, "5": 0.0336555029952162, "2": 0.009014649524589486, "1": 0.000290283362493628}, "score": 3.6679904150066065}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5956879636144049, "4": 0.3698682565972919, "3": 0.03404798587903611, "2": 0.0003684981008792979, "1": 2.6578232613134597e-05}, "score": 4.560823649269236}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6335721592658317, "5": 0.30370379837852574, "3": 0.06155752964747333, "2": 0.0010036897694830932, "1": 0.00013504277201027988}, "score": 4.239740420904907}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5661994656797682, "5": 0.34367552775620797, "3": 0.08927259724049223, "2": 0.0006791764477676421, "1": 0}, "score": 4.253088420855147}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7576891271169649, "5": 0.13411354326777994, "3": 0.10711406331694256, "2": 0.0009581582555036516, "1": 0}, "score": 4.025086301937967}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7703302037648992, "5": 0.17278388241909962, "3": 0.056380467577976975, "2": 0.0003800952419262248, "1": 0}, "score": 4.115657722167951}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6365991177584078, "3": 0.2580672936421238, "5": 0.09011759954320868, "2": 0.014325293900177477, "1": 0.000873455302742432}, "score": 3.8007759175985405}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5994177389657679, "4": 0.35211480710965815, "3": 0.04806378481028594, "2": 0.0003513467255478221, "1": 4.027724051631544e-05}, "score": 4.5505370602833315}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.48206604090086197, "5": 0.4663867935793243, "3": 0.05129665672406486, "2": 0.0002110897836637423, "1": 3.0356861103337834e-05}, "score": 4.414580643697009}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6363700151411877, "4": 0.3383812028251079, "3": 0.025027296243708752, "2": 0.00017569763909476582, "1": 3.394971835059565e-05}, "score": 4.610896706523694}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.660809024458786, "4": 0.32977664071621154, "3": 0.009381416636707043, "2": 2.1762831943114174e-05, "1": 0}, "score": 4.651391348660812}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8756745721901137, "4": 0.12018320405068629, "3": 0.004124368754985763, "2": 1.1740067429638798e-05, "1": 0}, "score": 4.871532052663676}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5701062340460014, "5": 0.3222080255346411, "3": 0.10406196915849632, "2": 0.0032490208661040236, "1": 0.00036463926797386515}, "score": 4.21055622580071}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4891615088950863, "3": 0.41402153069477327, "5": 0.055945644138910816, "2": 0.03330259357145306, "1": 0.007563249901593271}, "score": 3.5526267282128225}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6172729749397342, "3": 0.187341354698122, "5": 0.17455007775001444, "2": 0.016318394671521415, "1": 0.004496841578847981}, "score": 3.941080209579737}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5002416486552376, "5": 0.37853386822077945, "3": 0.11856831341447199, "2": 0.0022967098044997993, "1": 0.0003482964057688499}, "score": 4.254330085193716}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6196796673655911, "5": 0.23502718280894214, "3": 0.13947919899302533, "2": 0.004962269908942171, "1": 0.0008463657188367586}, "score": 4.083084788454177}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8655691946144861, "4": 0.1314057518891034, "3": 0.002970434620514961, "2": 1.6752098901354166e-05, "1": 0}, "score": 4.862597919599226}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9636587989713197, "4": 0.03513248071188948, "3": 0.0011740595909068294, "1": 9.45585908112387e-06, "2": 0}, "score": 4.9624806309992735}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9323578488462625, "4": 0.06607042898996116, "3": 0.0015279351962016019, "1": 1.1237243317828004e-05, "2": 0}, "score": 4.930826500066015}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9647245063978548, "4": 0.03386525555693088, "3": 0.0013125729291178544, "1": 1.279329950848059e-05, "2": 0}, "score": 4.963455323773742}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7508936713485822, "4": 0.24066472419545828, "3": 0.008288669643289035, "2": 9.010237807221581e-05, "1": 3.672973180339318e-05}, "score": 4.742333984677115}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5152850687021213, "5": 0.41913960013658197, "3": 0.06400823704986255, "2": 0.0012837189294172394, "1": 0.000271822303803068}, "score": 4.351752522070525}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6638655931169439, "4": 0.3267671634773876, "3": 0.009245304296260285, "2": 5.602906410438457e-05, "1": 0}, "score": 4.65455137220307}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5863011579506601, "4": 0.38951924710051566, "3": 0.02399739010913776, "2": 7.164487030803086e-05, "1": 0}, "score": 4.562222637418483}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8281722374378218, "4": 0.16885586462546706, "3": 0.002938619399297839, "2": 9.285565131634614e-06, "1": 0}, "score": 4.825234846745064}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5375838989991863, "5": 0.42586452488188237, "3": 0.036391665512272874, "2": 0.00013604443468043115, "1": 1.5366234817612544e-05}, "score": 4.389157979614167}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9782633178801264, "4": 0.02143660723366522, "3": 0.00029599855068105133, "2": 8.580255151187251e-07, "1": 0}, "score": 4.9779687506850365}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9794195624507801, "4": 0.020303414603716284, "3": 0.00027447661277687704, "2": 5.153198814883104e-07, "1": 0}, "score": 4.979146043856432}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9908404060114372, "4": 0.008994958727253559, "3": 0.00016278373780791598, "2": 4.70891090513557e-07, "1": 0}, "score": 4.990678048253671}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987643456503023, "4": 0.001226443697909222, "3": 3.836634530492189e-06, "1": 0, "2": 0}, "score": 4.998765876400828}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9746847067250856, "4": 0.02503033724493945, "3": 0.0002831397403601509, "2": 4.128981023384086e-07, "1": 0}, "score": 4.97440210865617}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7051711215641914, "5": 0.24544057943623257, "3": 0.04744272903093616, "2": 0.0016306590837994548, "1": 0.0003118394767968534}, "score": 4.193801609051128}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5420225138156111, "5": 0.4431087516555785, "3": 0.014691983119264828, "2": 0.00014118972566002616, "1": 3.273355039768867e-05}, "score": 4.428037398980703}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6154750194285628, "3": 0.2985760812697174, "2": 0.047352379840028956, "5": 0.030349771206678092, "1": 0.008243719840284663}, "score": 3.612336596730489}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9428241773979281, "4": 0.05667868867573874, "3": 0.0004905510043309617, "2": 1.776369292577377e-06, "1": 0}, "score": 4.942334603035952}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8008901118713289, "5": 0.13261934791455568, "3": 0.06397585707473989, "2": 0.0022177537936056194, "1": 0.0002930014500451199}, "score": 4.063329227653072}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7526223757498625, "4": 0.24142683800670287, "3": 0.005899614318222251, "2": 3.5950664139144544e-05, "1": 0}, "score": 4.746662225244026}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9862016392552225, "4": 0.013675334093549263, "3": 0.00011656832222385644, "2": 9.40983718357588e-07, "1": 0}, "score": 4.986088629557013}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987469818835858, "4": 0.0012361333962519732, "3": 1.268511879447802e-05, "1": 0, "2": 0}, "score": 4.998738491068324}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9891150218095355, "4": 0.01081173673714569, "3": 6.471574707879402e-05, "2": 4.598327502453467e-07, "1": 0}, "score": 4.989057364008529}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9947289563610439, "4": 0.005223365254695509, "3": 2.7289460297666298e-05, "2": 1.582599346015e-07, "1": 0}, "score": 4.994721474256825}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"5": 0.907534210529952, "4": 0.0911795171299466, "3": 0.0011902701271663246, "2": 1.9684640290671737e-06, "1": 0}, "score": 4.906425238037964}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8790868945847783, "4": 0.11867459823177892, "3": 0.0022175158413899306, "2": 3.5491266458400166e-06, "1": 0}, "score": 4.876877575177648}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8709309168747108, "4": 0.12488882967467461, "3": 0.004123959637897811, "2": 1.1762453574124903e-05, "1": 0}, "score": 4.866822033092933}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9520332388898658, "4": 0.047032421309001864, "3": 0.0009166856015030108, "2": 1.7785022152261066e-06, "1": 0}, "score": 4.951128096105788}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9392285989892962, "4": 0.05907817571568993, "3": 0.0016657779956986555, "2": 2.8536091398150124e-06, "1": 0}, "score": 4.9375801723315895}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7496003358642955, "4": 0.23253712250777256, "3": 0.017632743134137072, "2": 0.00016418281916623316, "1": 3.750096094935871e-05}, "score": 4.731547291451619}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6483613235233618, "4": 0.33948755143659315, "3": 0.012072192640677295, "2": 2.1543379594623116e-05, "1": 0}, "score": 4.636282559755899}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8784971636399332, "4": 0.11857552258708422, "3": 0.0027595324935375874, "2": 1.663244919328494e-05, "1": 0}, "score": 4.875836747947953}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9712362504027215, "4": 0.02809590620248746, "3": 0.0006565828976947608, "2": 3.0547493943952006e-06, "1": 0}, "score": 4.970581522353333}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.981188138931455, "4": 0.018393611053815248, "3": 0.0003952891640511639, "2": 1.0417360058952223e-06, "1": 0}, "score": 4.980812264831897}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"3": 0.589723462256589, "4": 0.3385347273554405, "2": 0.06364083213105899, "5": 0.006361313485981309, "1": 0.0017327491980248843}, "score": 3.2841529888810053}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5974265688805535, "4": 0.32896010400249404, "2": 0.06083896643397853, "5": 0.01110231870651518, "1": 0.0016683369284004506}, "score": 3.2869901644370967}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5021638088844169, "3": 0.47402840638521704, "2": 0.015319388968925348, "5": 0.008232883180040729, "1": 0.0002549969432838118}, "score": 3.502800451652083}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5567015720076016, "4": 0.382517241849788, "2": 0.0538995257396078, "5": 0.005741579111226838, "1": 0.0011375839587191427}, "score": 3.3378265500806066}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5730096621606815, "4": 0.38666609577302485, "2": 0.030104723278090478, "5": 0.009255056760688093, "1": 0.000956882072817771}, "score": 3.3731605504107427}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4911383102098228, "4": 0.48205054754728693, "3": 0.02626166520221738, "2": 0.0003357076050266519, "1": 0.00012170943917108227}, "score": 4.463882806529573}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9445216217798034, "4": 0.05454886901037639, "3": 0.0009132398559391606, "2": 4.276318850978491e-06, "1": 0}, "score": 4.943611146047692}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8555888702341267, "4": 0.14274290984725282, "3": 0.0016316666530712494, "2": 7.085047362119557e-06, "1": 0}, "score": 4.853968198407527}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8904098737188669, "4": 0.10768818540016507, "3": 0.0018870592764991408, "2": 7.774199992875658e-06, "1": 0}, "score": 4.888513581067785}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9519360031807578, "4": 0.047402419845090804, "3": 0.0006407464712201167, "2": 1.961023553222322e-06, "1": 0}, "score": 4.951309285373374}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"3": 0.47032083006292136, "4": 0.3850452804698716, "2": 0.0781816432527721, "5": 0.05932789967873561, "1": 0.007091656690051838}, "score": 3.411349570148422}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6651261680041602, "4": 0.33083890960557233, "3": 0.003987159126669495, "2": 1.2729645415816243e-05, "1": 0}, "score": 4.66113671159778}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.585873982183252, "5": 0.22364021532599423, "3": 0.17226946002464152, "2": 0.01545343454030619, "1": 0.0027307652437461244}, "score": 4.012271984944013}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6954258133156692, "4": 0.2654938771892896, "3": 0.03774866379773687, "2": 0.0011332858884916704, "1": 0.00010453569143918476}, "score": 4.655158440329035}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5137751554452973, "3": 0.25236074180814405, "5": 0.14188213517907067, "2": 0.08220409176466112, "1": 0.009753413038467326}, "score": 3.6958455302670803}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4869750252834879, "4": 0.4824302298529088, "3": 0.03004573975294797, "2": 0.0003285399874666003, "1": 0}, "score": 4.456372819845553}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8367098109344645, "4": 0.15981135349816758, "3": 0.0032954518118096434, "2": 1.0199886144910746e-05, "1": 0}, "score": 4.833538314741016}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5010141874674121, "5": 0.4846354597699108, "3": 0.014244320686852623, "2": 5.5573060361535016e-05, "1": 0}, "score": 4.470303724025217}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.680742462388524, "4": 0.3089723772788022, "3": 0.01016642149066463, "2": 5.308315031187644e-05, "1": 0}, "score": 4.670513897650979}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9646557259219819, "4": 0.035057651040777654, "3": 0.00022054208932508195, "2": 7.532437171197455e-07, "1": 0}, "score": 4.964496685699407}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6694479108096401, "3": 0.2308947961779881, "5": 0.08909090731941566, "2": 0.00982233897647709, "1": 0.0007061496317069997}, "score": 3.836426785345369}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6319528196970453, "5": 0.30404824181042384, "3": 0.0636066470965869, "2": 0.0003540198758279542, "1": 3.0054895453057312e-05}, "score": 4.239645359351791}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6938156623277567, "5": 0.26804237373982664, "3": 0.03795490251321651, "2": 0.00013742640781880784, "1": 0}, "score": 4.229824025729106}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7221700799740222, "5": 0.2358734845772042, "3": 0.04177175021942668, "2": 0.0001593065857651198, "1": 1.7432626871603507e-05}, "score": 4.193732362706223}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7032797703363679, "3": 0.15661136885628152, "5": 0.1386029095531088, "2": 0.0014392296123166273, "1": 5.706480534926077e-05}, "score": 3.9789416836994276}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6007578905219279, "5": 0.3261831648594466, "3": 0.06843302152613907, "2": 0.003940794209384854, "1": 0.0006487187462382136}, "score": 4.247931425892973}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6468330402152381, "4": 0.34889233502662165, "3": 0.004229338420199858, "2": 1.8014780466300034e-05, "1": 0}, "score": 4.642585196533225}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7161209727057869, "4": 0.2784245143445239, "3": 0.00535509036682886, "2": 2.6704218734556015e-05, "1": 0}, "score": 4.710764159508448}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9480968590051048, "4": 0.051577982153993444, "3": 0.00030733045150547106, "2": 1.0833212545489704e-06, "1": 0}, "score": 4.94780323294081}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7685550081272868, "4": 0.2281466853716089, "3": 0.0032775732277928746, "2": 7.1952390047810285e-06, "1": 0}, "score": 4.765273404719092}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7594112325085308, "3": 0.20952095934874357, "5": 0.02880310169200928, "2": 0.002194765657749027, "1": 5.985198262156136e-05}, "score": 3.8147111857361966}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8244104699183165, "5": 0.13649014019086636, "3": 0.03810883248359664, "2": 5.277895638552424e-05, "1": 0}, "score": 4.098367997182508}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7824033410597543, "3": 0.1258376996950339, "5": 0.09037545174085647, "2": 0.0013369331260854379, "1": 4.2931402791913185e-05}, "score": 3.961734952186645}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7189515994558741, "5": 0.21688530794090222, "3": 0.06359624190029016, "2": 0.0005268337626904057, "1": 2.9297276455468385e-05}, "score": 4.152149137673466}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7752117043723645, "4": 0.2233397554349033, "3": 0.0014161005165016977, "2": 2.204561356825032e-06, "1": 0}, "score": 4.773814591106203}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5951933906164265, "5": 0.36272300776756744, "3": 0.041816879716344034, "2": 0.00017672512475150397, "1": 0}, "score": 4.320581529105436}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9478621335951432, "4": 0.0503826252723439, "3": 0.0017323046316209797, "2": 7.367464063887528e-06, "1": 0}, "score": 4.9461298243654745}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7769562783636085, "5": 0.15269090954447276, "3": 0.07008695454842079, "2": 0.00023544740565542387, "1": 1.8207535702290423e-05}, "score": 4.082079439160374}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6659677387036042, "4": 0.3280983723048856, "3": 0.005876105890414002, "2": 8.746980525058475e-06, "1": 0}, "score": 4.660106507914452}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6118965908169948, "5": 0.3487359616465413, "3": 0.039257765782228976, "2": 8.728115353845884e-05, "1": 0}, "score": 4.309310562299633}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5188848963943354, "4": 0.3905365172461176, "2": 0.07901038337700471, "5": 0.009344739633934406, "1": 0.0021955076139248747}, "score": 3.32583370682979}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.667837098303814, "3": 0.26671342809473936, "5": 0.05422953460714175, "2": 0.010473971543488237, "1": 0.0006774376763968256}, "score": 3.764519712985285}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.49979003437788094, "4": 0.4013077257852955, "2": 0.08060903008105424, "5": 0.014857403288738543, "1": 0.0034141500643361453}, "score": 3.3435926431336886}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6667871296209579, "5": 0.22095849511752708, "3": 0.10721724239954403, "2": 0.004631043770027037, "1": 0.00032107108845223607}, "score": 4.103524753380417}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.46875796961345917, "4": 0.4597615286046128, "2": 0.056064868083095104, "5": 0.013733680946180698, "1": 0.0016700428403137802}, "score": 3.42782903213952}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5723868299715423, "5": 0.4094301762481436, "3": 0.01787248320563549, "2": 0.000236671844184595, "1": 5.2012005033471953e-05}, "score": 4.390936846210253}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9868064036885976, "4": 0.013176082826003493, "3": 1.619697599703585e-05, "1": 0, "2": 0}, "score": 4.986791505832896}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9427645305703488, "4": 0.05714119322019569, "3": 8.667838614577131e-05, "2": 1.002347401801881e-07, "1": 0}, "score": 4.942684719576902}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9619149584534971, "4": 0.03799889114789719, "3": 7.400073739592176e-05, "2": 6.38203328921349e-08, "1": 0}, "score": 4.961852454871152}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9631789200473198, "4": 0.03674842174352164, "3": 6.241268612293715e-05, "2": 8.58329389739104e-08, "1": 0}, "score": 4.96312612075823}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"3": 0.44536242058578024, "4": 0.26765088917298313, "2": 0.2388559090181535, "1": 0.026110576940012495, "5": 0.02199058218010253}, "score": 3.0205555995350957}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7285062675651612, "3": 0.1449265669022581, "5": 0.12231492594888113, "2": 0.004056004107485921, "1": 0.00018792567857974703}, "score": 3.968712313801571}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6352161273287869, "5": 0.3251205637689969, "3": 0.03935923275505066, "2": 0.0002721987663235041, "1": 0}, "score": 4.285226025739948}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6244278428295891, "5": 0.34184512341542816, "3": 0.03328120685549141, "2": 0.00030994738521590586, "1": 0}, "score": 4.307985870760028}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7209677516148857, "5": 0.2235559412112924, "3": 0.05469056886774535, "2": 0.0007535316023756308, "1": 2.349993271522912e-05}, "score": 4.167289265889976}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7432161658776154, "3": 0.19241992227176782, "5": 0.06133077026941954, "2": 0.002955450163892083, "1": 7.240291477932846e-05}, "score": 3.86278201324786}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.61247262588172, "5": 0.32956581597287016, "3": 0.05717325842304064, "2": 0.0006541224445164749, "1": 8.925938399772437e-05}, "score": 4.270828699563584}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8540609651312844, "3": 0.08015936206084835, "5": 0.06520515817925855, "2": 0.000537003470886772, "1": 0}, "score": 3.9839711879173385}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6406132424964877, "5": 0.2794961670714435, "3": 0.07792953952286166, "2": 0.0018498870422486628, "1": 0.00010900170866852142}, "score": 4.197540275451423}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5585920989220131, "5": 0.3632541325486633, "3": 0.0763495760538678, "2": 0.001596071470407622, "1": 0.0001135891007934213}, "score": 4.28339843644546}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6743862236961146, "5": 0.23078085462968218, "3": 0.09189778979670175, "2": 0.002692649300393305, "1": 0.00023533359435088958}, "score": 4.132792714781969}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8432040146492142, "4": 0.14861650245564853, "3": 0.00805966086219171, "2": 9.417064962855225e-05, "1": 1.9018012529956774e-05}, "score": 4.834904496681275}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8183898309068981, "4": 0.1779980827171551, "3": 0.003570055989429449, "2": 2.4870604352047533e-05, "1": 0}, "score": 4.814784015224977}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972086500821193, "4": 0.00273149172391854, "3": 5.203016039115427e-05, "1": 1.0968336818174615e-06, "2": 0}, "score": 4.9971600415042445}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.666109265224354, "4": 0.30761816165559847, "3": 0.025673247052169498, "2": 0.0004514478931829253, "1": 0.00014577802061408599}, "score": 4.639097130526423}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9838687804730538, "4": 0.016049819107987487, "3": 7.577917797134662e-05, "2": 1.4508225202637895e-07, "1": 0}, "score": 4.98379809856513}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9769254420537697, "4": 0.02299288175195593, "3": 7.58842048471596e-05, "2": 3.275765725130705e-07, "1": 0}, "score": 4.976854240630647}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9669336404794269, "4": 0.03293340127145899, "3": 9.701907008203825e-05, "2": 1.793450917899942e-07, "1": 0}, "score": 4.966870837859765}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9938830978884463, "4": 0.00608533804661159, "3": 1.869149407283992e-05, "1": 0, "2": 0}, "score": 4.993877200149067}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9943463324727, "4": 0.005638098588566211, "3": 1.1482458901294817e-05, "1": 0, "2": 0}, "score": 4.994338913359715}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5584017464177022, "5": 0.4166042119119751, "3": 0.024619868485871187, "2": 0.0002614537903544387, "1": 0}, "score": 4.391505566115594}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6243334676937259, "4": 0.35748935268174287, "3": 0.018013436992407504, "2": 0.00011481964098423088, "1": 2.5371755267755585e-05}, "score": 4.606028548874845}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5728079180614165, "5": 0.3033723348427252, "3": 0.1213156684876706, "2": 0.002328013383973411, "1": 0.00016816599515138544}, "score": 4.176897538955835}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6504671577538325, "4": 0.3255518293680159, "3": 0.0236736609777371, "2": 0.00023485787829076473, "1": 6.312826177629524e-05}, "score": 4.626140260513809}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6736398419602236, "4": 0.296165458325581, "3": 0.0299831386597889, "2": 0.00017581363781193424, "1": 1.849929379225941e-05}, "score": 4.643260673182519}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6542272047385271, "4": 0.3359038569481741, "3": 0.009829910988013706, "2": 2.8087413503351972e-05, "1": 6.979941655749997e-06}, "score": 4.644322730597304}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9893847378198465, "4": 0.010521413684972947, "3": 9.320594973052057e-05, "2": 1.5246176403129813e-07, "1": 0}, "score": 4.989291711782316}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.937924953599678, "4": 0.05960014929287261, "3": 0.002456709072659041, "2": 1.2691907148755908e-05, "1": 3.538488144029938e-06}, "score": 4.935434076490985}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9632294661137485, "4": 0.03559399269092744, "3": 0.0011596341633823308, "2": 9.357204281170744e-06, "1": 0}, "score": 4.962058380916779}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9840424722555912, "4": 0.015622579614978675, "3": 0.00032899434361706345, "1": 1.7027209970082463e-06, "2": 0}, "score": 4.9837125515748}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7205857615661362, "5": 0.23820207760397577, "3": 0.04090155079107494, "2": 0.0002616502158995549, "1": 0}, "score": 4.1967868610309695}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5687697636761598, "5": 0.2623590483056763, "3": 0.16598364824926218, "2": 0.0027562486736077, "1": 0.00012227646138314615}, "score": 4.0904968891213755}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7330880951043918, "5": 0.2310542147753395, "3": 0.035689562496105214, "2": 0.0001390429054723746, "1": 0}, "score": 4.1950922406712285}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4944164009234626, "5": 0.4859812189325774, "3": 0.019524490077239755, "2": 5.469807724873168e-05, "1": 0}, "score": 4.466358148474109}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5235552576456883, "4": 0.4509920622350905, "3": 0.02527490683843253, "2": 0.00013672143818670087, "1": 0}, "score": 4.498027352871384}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9293585239701684, "4": 0.06822347262225044, "3": 0.0023761629456837494, "2": 1.687649048616565e-05, "1": 0}, "score": 4.926971748939752}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9779570901618427, "4": 0.021787640924968807, "3": 0.0001975547098668069, "2": 3.5455796228839046e-07, "1": 0}, "score": 4.977814913452715}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9547583854881736, "4": 0.04472350842766683, "3": 0.0004405487275399216, "2": 8.654052003389045e-07, "1": 0}, "score": 4.954389299928057}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9882403822054306, "4": 0.011717783896990795, "3": 3.837516701054742e-05, "1": 0, "2": 0}, "score": 4.988205424974731}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9916977496270535, "4": 0.008248155330004761, "3": 4.939719088813022e-05, "1": 0, "2": 0}, "score": 4.991653011075299}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5844108109773047, "4": 0.37529417270252885, "3": 0.0350695621478232, "2": 0.0029945748821811015, "1": 0.0022005520902212677}, "score": 4.536766721426138}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7358901530244698, "4": 0.24633250730565537, "3": 0.01676038856714087, "2": 0.0005830517561480393, "1": 0.00041333754440854906}, "score": 4.7167383857447085}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7374322569279805, "4": 0.25236445153831505, "3": 0.010012733960692364, "2": 0.0001256663725045138, "1": 4.795737319746446e-05}, "score": 4.727036629615421}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9439542745372452, "4": 0.0537826152850332, "3": 0.0021813594404499286, "1": 3.4718183086477764e-05, "2": 3.313527940955008e-05}, "score": 4.9416155758791085}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9561700224430449, "4": 0.04181355958790541, "3": 0.0019049883231544028, "1": 4.96672398574248e-05, "2": 3.592796846165512e-05}, "score": 4.954068824294879}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6091417985703065, "4": 0.25129352519632386, "2": 0.11038714413193998, "5": 0.01978347471730111, "1": 0.009378800524440874}, "score": 3.1617181967619423}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5552444010024996, "4": 0.3563629660428411, "2": 0.04664080393780564, "5": 0.03318804029623357, "1": 0.008527619758249408}, "score": 3.3590559898635903}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6240045618390055, "3": 0.30055870089725584, "5": 0.06697882863828758, "2": 0.007601455780252445, "1": 0.0008103364712063518}, "score": 3.7487746211633812}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7603118050779584, "4": 0.22082825638695644, "3": 0.018727075773411216, "2": 9.858829651530736e-05, "1": 2.109150932766374e-05}, "score": 4.741334051157586}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5594523277243497, "5": 0.36423842938433787, "3": 0.07453611544398142, "2": 0.0016283175095200943, "1": 0.00013967824924411012}, "score": 4.286028111980775}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5477950271780719, "5": 0.4442733290451434, "3": 0.007869093558475263, "2": 3.3252121113828296e-05, "1": 0}, "score": 4.436350515484254}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9530469367183368, "4": 0.04661604890679947, "3": 0.00033164945675532713, "2": 7.657416466576353e-07, "1": 0}, "score": 4.95271813749712}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6986958661003908, "4": 0.2981383614687583, "3": 0.0031283245665411187, "2": 1.4351070776084433e-05, "1": 0}, "score": 4.695554904480318}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8345703061485265, "4": 0.16394653670619808, "3": 0.0014752566563828427, "2": 4.044915086041985e-06, "1": 0}, "score": 4.833090171702616}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9256459924504609, "4": 0.07388706501312889, "3": 0.0004611311800605357, "2": 1.1827953267286884e-06, "1": 0}, "score": 4.925186777963206}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9249374864219827, "4": 0.07360301422072242, "3": 0.0013685424645070478, "2": 1.3316176281723748e-05, "1": 0}, "score": 4.923614021659328}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9955000468660367, "4": 0.0044223059977171846, "3": 5.2652438772063594e-05, "1": 0, "2": 0}, "score": 4.995472275955646}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9788435521009571, "4": 0.020693182102355816, "3": 0.0003743084005293378, "2": 1.1600725635708661e-06, "1": 0}, "score": 4.978552837875461}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.981668095546916, "4": 0.017854048317005933, "3": 0.0004470227811982636, "2": 1.6569997009444163e-06, "1": 0}, "score": 4.98124638795945}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9757623510449875, "4": 0.023610961604940067, "3": 0.0005230687758310627, "2": 1.6155146230582223e-06, "1": 0}, "score": 4.975335538448986}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5535621763942854, "5": 0.3280460447877334, "3": 0.11434520409157568, "2": 0.0032667087480518662, "1": 0.0007687651743857383}, "score": 4.204863401825361}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6228377048443803, "4": 0.3557279947014401, "3": 0.021339343444636165, "2": 5.8561152958854835e-05, "1": 0}, "score": 4.60140312767581}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6081016156363243, "4": 0.3385718666520846, "3": 0.05191673467664557, "2": 0.0010431200593003901, "1": 0.0003568014833128875}, "score": 4.553033690128634}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.635557107548852, "4": 0.3433783082852772, "3": 0.020751598481904256, "2": 0.00024881373341731203, "1": 5.149488889381319e-05}, "score": 4.614161182692611}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.48517341269629316, "5": 0.48308836101566716, "3": 0.03128500718090351, "2": 0.00031638364952567624, "1": 7.223455683840136e-05}, "score": 4.450983016774314}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4451462229015621, "4": 0.29629387388382633, "2": 0.14692306449382564, "1": 0.08158025657706794, "5": 0.0300359824813429}, "score": 3.0462832146171452}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7683770390816758, "4": 0.2145606349802674, "3": 0.016131812901681412, "1": 0.00048171013715950966, "2": 0.0004142420885872092}, "score": 4.749997532114021}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6805204063850249, "4": 0.29443738885630616, "3": 0.024600965225613662, "2": 0.00035468765530153495, "1": 7.860777066448014e-05}, "score": 4.654979445763673}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5209121132697652, "4": 0.4649660438684386, "3": 0.01402806939253822, "2": 7.269764989596866e-05, "1": 1.613377753705982e-05}, "score": 4.5066927513415935}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7652849736092608, "4": 0.20836346424406665, "3": 0.025667481488378625, "2": 0.00047565155457505185, "1": 0.00019647232033740848}, "score": 4.738085597180323}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9020035709524696, "4": 0.09400948476942352, "3": 0.0038792711148178563, "2": 6.840388067024729e-05, "1": 3.5036891805901785e-05}, "score": 4.89788618160612}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9981650250289458, "4": 0.0017132296595572794, "3": 9.544627826635555e-05, "1": 4.635268183975169e-06, "2": 0}, "score": 4.998077295058146}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9730067320119251, "4": 0.024021111246878026, "3": 0.0027790865066746914, "1": 0.00010230448953469563, "2": 8.610216514350656e-05}, "score": 4.969753050227139}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9780781785249961, "4": 0.021279474699228678, "3": 0.0006210301043447875, "1": 9.69719392876932e-06, "2": 8.001776327455022e-06}, "score": 4.977415589283735}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9800453626210179, "4": 0.018909379692429833, "3": 0.0010131459369250196, "1": 1.1407574424425196e-05, "2": 1.1287258892784091e-05}, "score": 4.978984638459443}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4772489101418241, "3": 0.3644928294564645, "1": 0.09221942383001382, "4": 0.0607177622599652, "5": 0.005319239164754358}, "score": 2.409667399440534}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.47584448039270444, "3": 0.3900060410915812, "5": 0.08891533981479717, "2": 0.04276176144148863, "1": 0.0024606961039025104}, "score": 3.605999085142567}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5300370548863474, "2": 0.22246368592984442, "4": 0.1987885464201746, "5": 0.024749440408020303, "1": 0.023956705863875525}, "score": 2.9779102287058614}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.552899627145514, "4": 0.241425099739727, "2": 0.17633214058201405, "5": 0.017198666968457815, "1": 0.012140952946678022}, "score": 3.075208651380506}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5357198084604281, "2": 0.23862822072814172, "4": 0.19711487467795488, "5": 0.015052612722959987, "1": 0.013480056258870119}, "score": 2.961631597015255}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8563823260275002, "4": 0.1410917487306763, "3": 0.0024687834007219613, "2": 9.323131386699106e-06, "1": 0}, "score": 4.853935730468814}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9960925165589268, "4": 0.003862371136628493, "3": 3.227134090768446e-05, "1": 0, "2": 0}, "score": 4.996073035755551}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9152297484706384, "4": 0.08415131766007501, "3": 0.0006103390106546937, "2": 1.5459251874675091e-06, "1": 0}, "score": 4.914622764724605}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.908333833419024, "4": 0.09111027435598096, "3": 0.0005026527420199506, "2": 9.48760918502273e-07, "1": 0}, "score": 4.907876756686312}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9088113101002364, "4": 0.09036908953300626, "3": 0.0007912251428807353, "2": 3.0693553565321697e-06, "1": 0}, "score": 4.908036924909676}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4028504007388351, "2": 0.3465165493572285, "1": 0.13809475486369713, "4": 0.10475001258884421, "5": 0.007784814514434454}, "score": 2.497611840282622}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6356747791281062, "5": 0.3286709765165725, "3": 0.03516102690376294, "2": 0.00043581064910085343, "1": 5.0374347028239914e-05}, "score": 4.292489262191224}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7020591284093497, "3": 0.2198811293043103, "5": 0.06670149583501206, "2": 0.010854544920740696, "1": 0.0004993486543909496}, "score": 3.823612462932936}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7516713012422445, "5": 0.1524993873987677, "3": 0.09344423852539228, "2": 0.002195992874726897, "1": 0.00018593972423938893}, "score": 4.054105513855212}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8315967093638795, "5": 0.08705915925327584, "3": 0.08067673784245111, "2": 0.0006332153425949109, "1": 1.917551218472294e-05}, "score": 4.005058540080768}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.482031940755265, "5": 0.37050001268814153, "3": 0.13213607713617626, "2": 0.011989063736770044, "1": 0.0033337669437209193}, "score": 4.204386375081189}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4205198605028188, "4": 0.31033457168161416, "2": 0.18535379033233795, "1": 0.045534272263731204, "5": 0.03825545938021048}, "score": 3.1104233814907274}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.30944107274283217, "3": 0.2616392846482086, "1": 0.21183345556559496, "4": 0.15034599616479372, "5": 0.06673854546152602}, "score": 2.55071436395158}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.2826363471648125, "5": 0.26064313659409977, "4": 0.1796820102696487, "3": 0.1441611655559151, "2": 0.1328743943996534}, "score": 3.002821203039878}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7928865752888794, "4": 0.18381716203451823, "3": 0.021652499085378377, "2": 0.00102802067529165, "1": 0.000595245281232248}, "score": 4.767408029058667}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5899601421749704, "3": 0.3690552563302525, "5": 0.024490387141422265, "2": 0.01604244911871878, "1": 0.0004414688920877715}, "score": 3.6220219341058266}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8145968587193269, "3": 0.10782103604289546, "5": 0.07698100314265685, "2": 0.0005528084498949585, "1": 2.507914333699575e-05}, "score": 3.967978369403756}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7208579710045776, "3": 0.19666006482507142, "5": 0.07621736157881283, "2": 0.006066593706748208, "1": 0.0001844112942634897}, "score": 3.8668690651975166}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7925376551298822, "3": 0.12611724358990326, "5": 0.07940806036098597, "2": 0.0018434084545978307, "1": 8.207328420531072e-05}, "score": 3.949357194619946}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4933354551113252, "4": 0.45367126006436753, "2": 0.029775522964974124, "5": 0.02151131506915917, "1": 0.0016988369654835132}, "score": 3.463524220644804}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8688426068250891, "4": 0.127460750626385, "3": 0.0036777982775304356, "2": 7.13609392954951e-06, "1": 0}, "score": 4.865160665813965}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.758365757527604, "4": 0.23402465638703826, "3": 0.007555670031719776, "2": 2.4849523019305398e-05, "1": 0}, "score": 4.7507822110839735}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8646891852783511, "4": 0.1305918589292098, "3": 0.004669521383624978, "2": 1.4887553941721225e-05, "1": 0}, "score": 4.860019599759143}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.95238961353408, "4": 0.04704912078254773, "3": 0.0005571489160496899, "2": 1.1792003720510292e-06, "1": 0}, "score": 4.951832902290161}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9895677483768195, "4": 0.01027911615285621, "3": 0.0001460901004836367, "2": 3.0711363846017406e-07, "1": 0}, "score": 4.98942771106647}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6284630144615208, "5": 0.2143006378654577, "3": 0.15534143161858224, "2": 0.0017262143588998209, "1": 0.00016495151099670392}, "score": 4.055012129301722}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7178828390925576, "4": 0.2669547261342303, "3": 0.015101916842589791, "2": 5.4495577847498935e-05, "1": 5.531115748181158e-06}, "score": 4.702655682917516}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7179612864362778, "3": 0.18184647351700461, "5": 0.0983990233773612, "2": 0.001691705647721165, "1": 0.00010075114423809892}, "score": 3.9128668189216658}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7768311984719934, "4": 0.21997541255261338, "3": 0.0031856497742877242, "2": 6.802026333172774e-06, "1": 7.213520778910752e-07}, "score": 4.773629947555706}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7106827011679336, "3": 0.23830235796095994, "5": 0.0471565481705723, "2": 0.003698492406751892, "1": 0.00015664397544552656}, "score": 3.8009866254188713}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7739899577188728, "5": 0.1452670509178059, "3": 0.07977790440676215, "2": 0.000846691293696255, "1": 0.00010677668078378206}, "score": 4.063476171409798}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5430967869980445, "3": 0.41872759573356405, "5": 0.02879394952064862, "2": 0.00909161244350206, "1": 0.0002762669360619294}, "score": 3.5910486893206555}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.733270422121484, "5": 0.22073535140524783, "3": 0.04588249074236449, "2": 0.00010451353222155958, "1": 4.934523228396019e-06}, "score": 4.174629429524215}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6917927931965583, "3": 0.20612574166018616, "5": 0.09982353518197683, "2": 0.002160193452400304, "1": 8.434702662822077e-05}, "score": 3.889122880949888}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.782734571191179, "5": 0.12282609326127648, "3": 0.09339127065995727, "2": 0.0008535862212801457, "1": 0.00014395583598172864}, "score": 4.0272971617806865}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4732745097281329, "5": 0.4396166639924285, "3": 0.0811387034908376, "2": 0.0048013684881698816, "1": 0.0011568693019841476}, "score": 4.345408720801409}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7710915812865958, "4": 0.21820523808111827, "3": 0.010415777032448344, "2": 0.00017174735968381196, "1": 6.01932703562749e-05}, "score": 4.760193892334602}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.48128700636194777, "5": 0.3599904772374642, "3": 0.13793785794347418, "2": 0.013512132411177118, "1": 0.007072883727401462}, "score": 4.173844409990506}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7753307627754705, "4": 0.21098266611381897, "3": 0.013320013504753833, "2": 0.00024157489710813256, "1": 8.22731293456879e-05}, "score": 4.761313295459182}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5785533588742221, "5": 0.31262921727227866, "3": 0.10046695615754922, "2": 0.006727298012288336, "1": 0.0016025278343357707}, "score": 4.193904084126035}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8719338657317993, "4": 0.12424053425075414, "3": 0.0037832430024964444, "2": 1.3080382097693585e-05, "1": 0}, "score": 4.868149878470359}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8790609179508501, "4": 0.11623601997800447, "3": 0.004632833551103211, "2": 2.2584279298350587e-05, "1": 0}, "score": 4.8744245771362165}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.977542485148098, "4": 0.021921852688789562, "3": 0.0005244788788773706, "2": 1.5343603099081068e-06, "1": 0}, "score": 4.97702436478237}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9860121129655917, "4": 0.01376449676613393, "3": 0.00022017651332802886, "2": 9.79678872601331e-07, "1": 0}, "score": 4.9857921794292395}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8920583765328274, "4": 0.10407473834548567, "3": 0.0038295996931953426, "2": 2.1484990132743498e-05, "1": 9.716539707934753e-06}, "score": 4.888162060728206}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7890495650662877, "3": 0.1689308194894419, "5": 0.04029254156445093, "2": 0.001682470550527107, "1": 2.9420407257729516e-05}, "score": 3.867906514187086}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7291096986764731, "3": 0.23555788489405835, "5": 0.030512873574850954, "2": 0.004646162820222163, "1": 0.00013624851821040804}, "score": 3.7852459433419865}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8568414785622561, "5": 0.10089894576422521, "3": 0.0420826010684428, "2": 0.00015470569312435258, "1": 0}, "score": 4.058508236224295}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6629982687741903, "5": 0.27897396972222355, "3": 0.057663378212224954, "2": 0.000328580071790165, "1": 2.539068965883508e-05}, "score": 4.220579556088668}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6902529599169819, "3": 0.26367386483396443, "5": 0.04108453934108689, "2": 0.0047739482074676395, "1": 0.00020258074705678257}, "score": 3.767252217984456}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9641587803771312, "4": 0.03558812728425476, "3": 0.00020882603939191674, "2": 1.0373818197545041e-06, "1": 0}, "score": 4.963989551798812}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9636547063210912, "4": 0.03608846838471816, "3": 0.00022100284129294572, "2": 2.1283851740944163e-06, "1": 0}, "score": 4.963461909660284}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9806744879939353, "4": 0.01916859914448081, "3": 0.0001505867843152267, "2": 1.0431109622713874e-06, "1": 0}, "score": 4.980526995078774}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984764246211988, "4": 0.0015074778841768497, "3": 4.151109126630793e-06, "1": 0, "2": 0}, "score": 4.99848420178926}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9714113664863764, "4": 0.028397206537738702, "3": 0.00018992562686273928, "2": 1.1949765454642318e-06, "1": 1.5981850648909357e-07}, "score": 4.971218713786862}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5889033502802462, "5": 0.3824429450918649, "3": 0.028368412180113687, "2": 0.00019292462295172427, "1": 0}, "score": 4.3537213561381085}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7497229805113015, "4": 0.2451241407073929, "3": 0.005086864754448741, "2": 1.5465474037773297e-05, "1": 0}, "score": 4.744642825425969}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8657289068638945, "4": 0.13271168310962467, "3": 0.0015457830013814707, "2": 2.9494731405102267e-06, "1": 0}, "score": 4.864186452311978}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9696904879409395, "4": 0.030183978760134213, "3": 0.000108592306012999, "1": 0, "2": 0}, "score": 4.969598321593222}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7623287544890891, "4": 0.23404192804399593, "3": 0.003497107782351407, "2": 9.959088565927916e-06, "1": 0}, "score": 4.758904505057655}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3250642902700204, "2": 0.2813100323175961, "1": 0.17227652321729697, "4": 0.15930239940520513, "5": 0.06204268270940316}, "score": 2.657523291479102}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5231199454538182, "5": 0.3057075661947225, "3": 0.15632429740336473, "2": 0.012406331895101083, "1": 0.00243341806224846}, "score": 4.117271340700712}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7071542934853104, "4": 0.20094440524545265, "3": 0.07935323215079676, "2": 0.008615479946422875, "1": 0.003930785501176608}, "score": 4.598778824938044}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8532557604768524, "2": 0.06594728949875217, "3": 0.035667209987855726, "5": 0.025771596612229334, "4": 0.019346410124491734}, "score": 1.2984108276405657}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4944804567173267, "5": 0.4151365818523416, "3": 0.08419224197861701, "2": 0.004285330501650435, "1": 0.0018977777169690558}, "score": 4.3166827560657905}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8912309873925952, "4": 0.10737874731090763, "3": 0.0013817335120223067, "2": 5.7361058569464256e-06, "1": 0}, "score": 4.889840269376274}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9416940583306893, "4": 0.05796495935842095, "3": 0.00033564080585998904, "2": 1.268963668075545e-06, "1": 0}, "score": 4.941359713323862}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8633115024619396, "4": 0.13461656513369166, "3": 0.0020441069175697727, "2": 1.3210124695459357e-05, "1": 0}, "score": 4.861253562827662}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.916516058780917, "4": 0.08281734987401684, "3": 0.0006566108687219809, "2": 2.0522393400625237e-06, "1": 0}, "score": 4.915862604609307}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9727803805439297, "4": 0.026888413770766995, "3": 0.0003047743168515849, "2": 1.2226315671470144e-06, "1": 0}, "score": 4.972497676401989}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6076738329046546, "4": 0.381477045170907, "3": 0.010798701322489099, "2": 4.204185030332763e-05, "1": 6.122488049626907e-06}, "score": 4.596774026896923}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5914514076469919, "4": 0.40392761009877065, "3": 0.004606628658648195, "2": 9.234214544135433e-06, "1": 0}, "score": 4.5868293147621255}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.809193310928419, "4": 0.1892681095676798, "3": 0.0015226211324523753, "2": 2.132149355371797e-06, "1": 0}, "score": 4.807677592627031}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9315013217440078, "4": 0.06819609321575439, "3": 0.00029750723914920497, "2": 3.0328314373741473e-07, "1": 0}, "score": 4.931207654006225}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9514217654114983, "4": 0.048394611698520405, "3": 0.00015961538186377703, "2": 2.7528098425361367e-07, "1": 0}, "score": 4.951284175559788}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5155225152248792, "3": 0.24338186699302522, "1": 0.18502805809971168, "4": 0.04912415548920106, "5": 0.00690329116957791}, "score": 2.1773191061859416}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6676642310127128, "5": 0.16271439385265243, "3": 0.15178861755509546, "2": 0.014313440328757017, "1": 0.0035159518281737668}, "score": 3.971750945085514}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.3246547074681029, "4": 0.30379701937827885, "2": 0.2516961683600111, "1": 0.07380113264501896, "5": 0.04604740820767036}, "score": 2.9965933900026136}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3616434851823285, "4": 0.317595918742091, "2": 0.18941672442314977, "5": 0.07282328689480022, "1": 0.0585080106459584}, "score": 3.1568117185846867}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.3822743861004533, "1": 0.29551596988270273, "3": 0.23118636935474154, "4": 0.07541484802097344, "5": 0.015584000499965233}, "score": 2.133255351927919}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8809976327966689, "4": 0.1123263281415627, "3": 0.00639598390775095, "1": 0.00014121217661120942, "2": 0.0001044588859354572}, "score": 4.873999146253803}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.870136267750819, "4": 0.11860407901097862, "3": 0.009391411289350548, "1": 0.0011421621386775395, "2": 0.0007044485216885623}, "score": 4.855927987827287}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9176719501547203, "4": 0.07779416893719636, "3": 0.00438968415918151, "2": 7.814871062135074e-05, "1": 6.12344266282122e-05}, "score": 4.912946659865092}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9189871365037353, "4": 0.07964460330800216, "3": 0.0013139881200742137, "2": 1.2449712844728413e-05, "1": 0}, "score": 4.917686628774254}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4803398186700127, "5": 0.4298763370120744, "3": 0.08371542745604527, "2": 0.0048685311465497165, "1": 0.001198590734786121}, "score": 4.332828506065008}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"4": 0.808362857664427, "5": 0.09571349278716072, "3": 0.09340753149564386, "2": 0.0023735244945820733, "1": 0.00010498532284560852}, "score": 3.9972438526799787}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6606211170939238, "5": 0.3120624346919753, "3": 0.0270851492353017, "2": 0.00020039162120137936, "1": 1.8024961693189248e-05}, "score": 4.284526092706963}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6474353279568917, "5": 0.31080763349361157, "3": 0.041199341737476906, "2": 0.0005033460762957567, "1": 3.808572568381736e-05}, "score": 4.268491709446842}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6139520674037399, "4": 0.3793865017501014, "3": 0.00661706077049086, "2": 2.1914851506512175e-05, "1": 0}, "score": 4.60730481409597}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8556951751988923, "5": 0.0776730056192368, "3": 0.06523827124310615, "2": 0.0013218888741154157, "1": 5.5156221947351026e-05}, "score": 4.0096256468125935}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6570666432166451, "4": 0.32216707549702567, "3": 0.020498497258255914, "2": 0.0002123817914304289, "1": 2.920726728593889e-05}, "score": 4.636072422471285}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5468952467100807, "4": 0.4422544870657194, "3": 0.010739465052864229, "2": 8.467941670056259e-05, "1": 1.9178340781374038e-05}, "score": 4.535932609003374}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6824678767934574, "5": 0.282999060820467, "3": 0.0342332049830759, "2": 0.0002684035302526512, "1": 2.6561971711118903e-05}, "score": 4.248150576789817}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5290194924876289, "5": 0.4601692142852495, "3": 0.01073829021965199, "2": 5.3646142107532326e-05, "1": 0}, "score": 4.4493323294467855}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5515642205580094, "4": 0.43486262602972303, "3": 0.013439226468104038, "2": 0.00010036901639272741, "1": 0}, "score": 4.537942308286246}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6865402395352114, "5": 0.23754269577030224, "3": 0.0753702985507151, "2": 0.00037493158074005165, "1": 0}, "score": 4.161450276795872}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7411780641925765, "5": 0.20338960558338928, "3": 0.05514440439442546, "2": 0.00026420664890811486, "1": 1.72527501190977e-05}, "score": 4.147665984512628}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6386593789591959, "5": 0.30427484214871786, "3": 0.056822363906409275, "2": 0.00020222087850646075, "1": 0}, "score": 4.247058213827834}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6744878208889606, "4": 0.29835372492719353, "3": 0.026986304025274556, "2": 0.0001194351513997659, "1": 3.488209142995085e-05}, "score": 4.6471695412064955}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5325701782187219, "5": 0.41858719897667673, "3": 0.04841765785885322, "2": 0.00032900026556854624, "1": 5.404075899022771e-05}, "score": 4.369364903534821}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"2": 0.47692622720617706, "3": 0.32095501688066497, "4": 0.0918548835482555, "1": 0.08952909703506205, "5": 0.020465126249747397}, "score": 2.4766595965130738}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.527936588513748, "5": 0.39421942833543017, "3": 0.07268025695726307, "2": 0.004298692810746679, "1": 0.0008354913191406315}, "score": 4.310444482969935}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6456028806906694, "4": 0.3241469229757156, "3": 0.028843633104565853, "2": 0.0009714079927632067, "1": 0.0004294029940103512}, "score": 4.613531751801827}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8588194030682722, "4": 0.12696055897614586, "3": 0.013047901013855837, "2": 0.0006518731957488932, "1": 0.000513844020821304}, "score": 4.842931634989875}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8267199127341386, "4": 0.1620800872771478, "3": 0.010928082792521287, "2": 0.00018545709434531046, "1": 7.851899405186199e-05}, "score": 4.8151918322969856}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5939096711227774, "5": 0.39425663257833676, "3": 0.01178280516087966, "2": 3.144690468035178e-05, "1": 0}, "score": 4.3824183694401}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6027507907608151, "5": 0.36020052093612603, "3": 0.03651378932544671, "2": 0.0004614213228131234, "1": 7.203683302239003e-05}, "score": 4.32254824320052}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5352435296760909, "5": 0.41743367900177963, "3": 0.046653949168431304, "2": 0.0005528211646355248, "1": 0.0001089352379018786}, "score": 4.369349898911846}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8562748139756777, "4": 0.14098849326270643, "3": 0.0027215437623168376, "2": 1.026485123549751e-05, "1": 3.915854457891855e-06}, "score": 4.853521819407236}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5871131605294354, "5": 0.3924661843474415, "3": 0.020301226013589135, "2": 0.00010344111958896844, "1": 8.296075386401865e-06}, "score": 4.3719360487688235}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.42130276373587117, "4": 0.3677248539311022, "2": 0.16016185200729044, "5": 0.025552221984206484, "1": 0.02525202319338574}, "score": 3.20816470785148}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5762291312947102, "4": 0.36882109127919965, "3": 0.05348756938612681, "2": 0.0010333472381246697, "1": 0}, "score": 4.520898260277912}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6094997867121016, "3": 0.25639162968572315, "5": 0.11036440672228241, "2": 0.02128927828286713, "1": 0.0024436682193944566}, "score": 3.8040610153438514}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.526955307257501, "4": 0.42972923271236346, "3": 0.042406844622358615, "2": 0.0006428513772651826, "1": 0.0002438807943000794}, "score": 4.482541677071214}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7262414526804293, "4": 0.20435955746289233, "3": 0.0643026137027098, "2": 0.0027017604497975222, "1": 0.0023874438600524676}, "score": 4.649377643733201}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.729382101186766, "5": 0.23294674820826464, "3": 0.037372168848999396, "2": 0.00024166284637647595, "1": 0}, "score": 4.195102436725444}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5211431056463588, "4": 0.4527648876692461, "3": 0.02583261598497606, "2": 0.0002075699845952855, "1": 0}, "score": 4.49492099685203}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8905140310533187, "4": 0.10599707283664457, "3": 0.0034697442184586733, "2": 1.1608755036529167e-05, "1": 0}, "score": 4.8870277602962995}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9659069948769406, "4": 0.03377431758760822, "3": 0.000315332474864888, "2": 1.1988881168411987e-06, "1": 0}, "score": 4.96559134660732}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9028414286719223, "4": 0.09430918426223635, "3": 0.0028158184884228554, "2": 1.26759127404352e-05, "1": 0}, "score": 4.900019062154488}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6669296039104754, "5": 0.28018639524149197, "3": 0.051977569979784304, "2": 0.0008108471440282603, "1": 7.067914552020836e-05}, "score": 4.226380731453833}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5827057715748356, "4": 0.4038810803182541, "3": 0.013320457068588839, "2": 7.64245941986476e-05, "1": 1.1301953173160358e-05}, "score": 4.569201385253455}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.769425304954158, "4": 0.22656101238036164, "3": 0.003957229973985094, "2": 2.3953478609471268e-05, "1": 0}, "score": 4.765445044384404}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6296098985727947, "5": 0.3304674538602792, "3": 0.03917276672590081, "2": 0.0005505451988971776, "1": 0}, "score": 4.290251454196586}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5167112867573771, "5": 0.4727846403440063, "3": 0.010411992626742913, "2": 7.718387467641075e-05, "1": 8.948425168382736e-06}, "score": 4.462194183810482}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8542974788145453, "4": 0.14162452692145067, "3": 0.004036342172420649, "2": 2.188926990251756e-05, "1": 0}, "score": 4.850234161128434}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9160975906244168, "4": 0.08253295589604169, "3": 0.0013560580237544874, "2": 5.976801495902495e-06, "1": 0}, "score": 4.914736365110531}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5413559869446836, "4": 0.4512427210961466, "3": 0.007338256489956434, "2": 2.180718620626846e-05, "1": 0}, "score": 4.533996131825963}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7537013552538442, "4": 0.2429285528664486, "3": 0.003348317158857647, "2": 1.0271186602969696e-05, "1": 0}, "score": 4.750341127296635}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9080881078603066, "4": 0.09096895359158706, "3": 0.0008927299771719863, "2": 1.2980141997853948e-06, "1": 0}, "score": 4.907237155329092}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"5": 0.38177068563965555, "4": 0.30723799614167746, "3": 0.20413519174445205, "2": 0.06364567538266756, "1": 0.04319660823038181}, "score": 3.9207532214365695}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5883622790351101, "4": 0.22428098856711517, "3": 0.08846150441149386, "1": 0.06704684666266333, "2": 0.0318453788035852}, "score": 4.235070182831389}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.44596460102996505, "4": 0.412287812290865, "3": 0.1108659128747246, "2": 0.020200660037197716, "1": 0.010679368248092628}, "score": 4.262659695548127}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5403038567465477, "4": 0.4038700545152643, "3": 0.050968901844330734, "2": 0.0029662136642957223, "1": 0.001880401426874948}, "score": 4.477766374144839}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.46367274803187536, "4": 0.43968199588273704, "3": 0.08501608543361969, "2": 0.006827765626435578, "1": 0.00479421162606878}, "score": 4.350621018624156}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7270519616000084, "4": 0.26804765422660193, "3": 0.004877020982138972, "2": 1.4305421023262424e-05, "1": 0}, "score": 4.722152870870596}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8814383651574902, "4": 0.11652458478992608, "3": 0.0020291992943899354, "2": 5.41964089631572e-06, "1": 1.0768170976263833e-06}, "score": 4.879396287096582}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8250904188886835, "4": 0.17218276140233918, "3": 0.0027121936678623374, "2": 1.0400392626307374e-05, "1": 0}, "score": 4.8223608994436615}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9178737858452645, "4": 0.08120438750186906, "3": 0.0009157670846709922, "2": 2.5504263925697116e-06, "1": 0}, "score": 4.916956135636915}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8137918322677469, "4": 0.18315512639579493, "3": 0.003037853799186391, "2": 9.309259574191687e-06, "1": 0}, "score": 4.810740125705012}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8041438643914597, "5": 0.12401482054436944, "3": 0.0712431645910285, "2": 0.00048528000680556836, "1": 0}, "score": 4.051806943413592}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.732034276717742, "4": 0.2606705837614511, "3": 0.007252986238177106, "2": 2.8507053787422412e-05, "1": 0}, "score": 4.724734166260272}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6553163059912799, "5": 0.3086027586041091, "3": 0.03082966818108779, "2": 0.00012543711508404613, "1": 0}, "score": 4.2789520771487135}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7387998453374464, "4": 0.25166143668531804, "3": 0.009431918090482001, "2": 5.4482827374146244e-05, "1": 0}, "score": 4.729297116272753}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.68625475309266, "4": 0.2934480374064465, "3": 0.020144217590220028, "2": 0.00011028760647337422, "1": 0}, "score": 4.665918397871328}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8010725113348189, "4": 0.19634271514921883, "3": 0.0025633794330746696, "2": 1.4142982405071104e-05, "1": 0}, "score": 4.798486635843764}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6946860028275228, "4": 0.30258531748641504, "3": 0.0027141647924863615, "2": 6.560826316892581e-06, "1": 0}, "score": 4.691964220312353}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5986515019065487, "4": 0.39805073776548094, "3": 0.0032447291473449947, "2": 7.45765154209732e-06, "1": 0}, "score": 4.595418992800904}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6299346721331536, "5": 0.35588696948179394, "3": 0.014129167517221184, "2": 3.164248114992942e-05, "1": 0}, "score": 4.34170051329501}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6495977979472132, "4": 0.3447567096962261, "3": 0.00560774500583058, "2": 1.3347292535708058e-05, "1": 0}, "score": 4.643979071483131}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9775171964511179, "4": 0.021799950060335846, "3": 0.0006711751679462905, "2": 7.669876840616605e-06, "1": 2.16455664584555e-06}, "score": 4.976825989016406}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9872003157372272, "4": 0.011888789282488392, "3": 0.000882892860949556, "2": 1.856098056195305e-05, "1": 7.783519065477036e-06}, "score": 4.986258585199625}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9910403510237534, "4": 0.008631016448497461, "3": 0.00032132001499236184, "2": 5.768393148635976e-06, "1": 1.140747281754437e-06}, "score": 4.990704471603387}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979264815157642, "4": 0.0020436374401323547, "3": 2.861017883887247e-05, "2": 4.0423113752433664e-07, "1": 0}, "score": 4.99789792768705}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9771480305620727, "4": 0.022442930817848067, "3": 0.0003997539600431363, "2": 4.782462388807948e-06, "1": 0}, "score": 4.9767431091677805}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9615287184659792, "4": 0.03818164409233318, "3": 0.0002267380889015811, "2": 5.733422520653945e-07, "1": 0}, "score": 4.961360751472896}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9778829833814916, "4": 0.022028167580451577, "3": 7.908898080797887e-05, "2": 1.8965086647708106e-07, "1": 0}, "score": 4.977812873165514}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9862891774113633, "4": 0.013541778074421284, "3": 9.531112666757397e-05, "2": 3.0763125353691243e-07, "1": 0}, "score": 4.986265668324792}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9929528623532516, "4": 0.006987702224676405, "3": 4.567908607186532e-05, "1": 0, "2": 0}, "score": 4.992920842219906}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9757779077481602, "4": 0.023999362775680218, "3": 0.00011255022404355111, "1": 0, "2": 0}, "score": 4.975772867448887}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7560103215892279, "4": 0.2402072227631595, "3": 0.003669375848160806, "2": 2.6225430190086516e-05, "1": 0}, "score": 4.75235384009893}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.961126489389088, "4": 0.03869547928928795, "3": 0.0001714851301126282, "2": 2.213603323651488e-07, "1": 0}, "score": 4.960960639452124}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6039254595525291, "4": 0.3883989678536047, "3": 0.007627195984384849, "2": 2.030642945786626e-05, "1": 0}, "score": 4.596274388238649}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9409604810852044, "4": 0.058721138866411435, "3": 0.00029899610841282786, "2": 8.035431103527285e-07, "1": 0}, "score": 4.940677356049165}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973068168423717, "4": 0.0026732064753733384, "3": 9.940770750600748e-06, "1": 0, "2": 0}, "score": 4.997306884955262}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"4": 0.542237300260671, "5": 0.4382085238707639, "3": 0.019322997734364352, "2": 0.0001645355338236277, "1": 0}, "score": 4.418584350618355}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8015109861817156, "4": 0.1958448529083836, "3": 0.002619031725334887, "2": 6.391727383819567e-06, "1": 0}, "score": 4.798894140246359}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8206841560030886, "4": 0.1783820465198278, "3": 0.000909654500796927, "2": 2.200070835860376e-06, "1": 0}, "score": 4.819788089893166}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971871966651561, "4": 0.0027853484408995478, "3": 2.7088697052919266e-05, "2": 1.233442019426014e-07, "1": 0}, "score": 4.997160103442712}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9899395824936147, "4": 0.009993214163301999, "3": 6.335586972525226e-05, "2": 3.173768398033152e-07, "1": 0}, "score": 4.989879086238926}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7603251714769819, "5": 0.13069604747636698, "3": 0.1072855829974032, "2": 0.0015990733080437775, "1": 8.622042150002687e-05}, "score": 4.019953814319704}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.739910090122562, "4": 0.25576070953818997, "3": 0.004304359210140834, "2": 1.4573583753793948e-05, "1": 0}, "score": 4.735584136388395}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6228013944646457, "5": 0.28280049347503916, "3": 0.0918476089295572, "2": 0.0023295993010313647, "1": 0.00021670122423319681}, "score": 4.185644362460737}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7332046653786046, "5": 0.20847803312673405, "3": 0.05778436740533788, "2": 0.000504884029305982, "1": 2.245619579257733e-05}, "score": 4.149617366014637}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5518929956258425, "5": 0.42515250462994275, "3": 0.0227603225052033, "2": 0.00017220825993824134, "1": 1.3786385648076156e-05}, "score": 4.402009695929814}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7641586762146909, "4": 0.2135349840538491, "3": 0.02124558648514441, "2": 0.0006668506834521615, "1": 0.00038764038147590725}, "score": 4.74042110386947}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8752178606638241, "4": 0.12006602249972882, "3": 0.00462916579955207, "2": 5.095146729428548e-05, "1": 3.182768657368956e-05}, "score": 4.8703949400558395}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.657835104583113, "5": 0.29211418752132207, "3": 0.04809407934438556, "2": 0.0016102827408009963, "1": 0.000335975942589649}, "score": 4.239794101500695}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9921688078210007, "4": 0.007681017143746844, "3": 0.00014485229353668793, "1": 1.5002661984019009e-06, "2": 0}, "score": 4.992023246713442}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8167404346891692, "4": 0.17593112425455706, "3": 0.0072406326051476354, "2": 5.527344299265737e-05, "1": 2.2483148160881833e-05}, "score": 4.809329941024792}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6941756448051467, "4": 0.2890786738680133, "3": 0.01653143762948871, "2": 0.00015774480325525056, "1": 3.09736411704657e-05}, "score": 4.677253083701893}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5864666061618847, "4": 0.382011448855027, "3": 0.03125959843626934, "2": 0.0002156601001763247, "1": 0}, "score": 4.554801589240056}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.589196579346675, "5": 0.3618887987938106, "3": 0.04809998565996942, "2": 0.0006352632995832994, "1": 0.00010749244413318239}, "score": 4.312218251592517}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5356212450837802, "5": 0.4263069296527589, "3": 0.03760607772599834, "2": 0.0003738406204149499, "1": 0}, "score": 4.387988829543103}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5303764349101019, "5": 0.43470419095742113, "3": 0.03442177915378099, "2": 0.00043603807083429045, "1": 3.552169220743556e-05}, "score": 4.399314166815796}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9727176606053518, "4": 0.02689683923058073, "3": 0.00037337682260762814, "2": 1.028721282798415e-06, "1": 0}, "score": 4.97235301422755}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6427408812651124, "4": 0.3456273871383451, "3": 0.011528274603515062, "2": 9.256402414077284e-05, "1": 1.033386698263407e-05}, "score": 4.6309968298038955}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.981815156515254, "4": 0.018154198912247527, "3": 2.531716332354033e-05, "1": 0, "2": 0}, "score": 4.981795069775993}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9902475055436968, "4": 0.009727396432885723, "3": 2.079745363802276e-05, "1": 0, "2": 0}, "score": 4.990230966647429}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9482600756015279, "4": 0.05110658117233207, "3": 0.0006275815093597419, "2": 3.7650590985860784e-06, "1": 8.704817873616e-07}, "score": 4.947623419719262}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6353556043400704, "5": 0.32766370047860166, "3": 0.03632540210274988, "2": 0.0005201383625267856, "1": 0}, "score": 4.2903372621010165}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9228965877779263, "4": 0.07600374223301185, "3": 0.001086014614911187, "2": 1.048792460731313e-05, "1": 2.11921462038697e-06}, "score": 4.921784205916336}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8703568143305346, "4": 0.12784273541716454, "3": 0.0016129286744574372, "2": 4.216336225599761e-06, "1": 0}, "score": 4.868894725941306}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8076714212800301, "4": 0.1901122104177522, "3": 0.0021487843829980143, "2": 3.46600473688444e-06, "1": 0}, "score": 4.805567356186412}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8596602722911142, "4": 0.13885373028719955, "3": 0.00147920573618802, "2": 5.3992851110529675e-06, "1": 0}, "score": 4.858171462902982}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"3": 0.49313751931166355, "4": 0.28625988269813785, "2": 0.16840038347652317, "1": 0.028809139454859373, "5": 0.023388004880344367}, "score": 3.1070177726717922}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6115607395536709, "4": 0.2878094931039706, "2": 0.05189454501594921, "5": 0.044486411321708476, "1": 0.004241617909894835}, "score": 3.3164068108558364}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5606277393152309, "3": 0.37685457826263813, "5": 0.05443372349511029, "2": 0.007506113928954042, "1": 0.0005741746153383606}, "score": 3.6608431486930995}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.610109621855796, "5": 0.235571995233964, "3": 0.1525714756423626, "2": 0.0016039916103605942, "1": 0.00013319764236194908}, "score": 4.079393714993119}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6383022383433806, "3": 0.2600559965004683, "5": 0.09839335575684367, "2": 0.002884986668509487, "1": 0.00036085115416108204}, "score": 3.831484399106091}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7645507290201621, "5": 0.156623804292649, "3": 0.07774527511456922, "2": 0.0010366574833532798, "1": 4.073287711827329e-05}, "score": 4.076683230386016}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4828983031419466, "4": 0.4579425039387729, "2": 0.03375907530109205, "5": 0.02356925194801456, "1": 0.001829060192600215}, "score": 3.4676646565065585}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6866116502991779, "5": 0.2574837931712175, "3": 0.055183614970857005, "2": 0.0006536653726929707, "1": 6.103500536146792e-05}, "score": 4.2008109957365996}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8649136012386424, "3": 0.10077894743193433, "5": 0.03344652447161426, "2": 0.0008049881509265033, "1": 5.332565556061539e-05}, "score": 3.930897443202618}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8094663626261609, "3": 0.13572407696328592, "5": 0.05325909451293895, "2": 0.0014948781208168763, "1": 5.446670284379169e-05}, "score": 3.9143817652151145}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6683091320244267, "3": 0.21081407396578725, "5": 0.11208858307356408, "2": 0.007278617053483869, "1": 0.001501139789131473}, "score": 3.8822128598499064}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.541682198036135, "3": 0.3388997967851596, "5": 0.10155220274044542, "2": 0.016286968002439974, "1": 0.0015324684157363383}, "score": 3.725468335762539}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.48763308057656324, "4": 0.4375118446785406, "2": 0.037104081572082004, "5": 0.03501945551763037, "1": 0.0027241868474607535}, "score": 3.4650017185850213}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5481985720030541, "4": 0.4127126875107002, "3": 0.03842811214977019, "2": 0.0005195124927874924, "1": 0.0001241920996986178}, "score": 4.508367462049392}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7002141935210466, "3": 0.15929309641672978, "5": 0.13453024975311656, "2": 0.0051128949948055545, "1": 0.000836561683724206}, "score": 3.9625011906749394}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8758262521611233, "5": 0.09789384516621226, "3": 0.026067047766699304, "2": 0.00018516819199312391, "1": 1.4679978490555403e-05}, "score": 4.071413349934609}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7152632372913752, "5": 0.27149984785365455, "3": 0.01317276682329264, "2": 3.584666577949222e-05, "1": 0}, "score": 4.258262696885885}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7208714583833891, "5": 0.2699841298620439, "3": 0.009080284992702352, "2": 4.229718595548688e-05, "1": 0}, "score": 4.26082494419535}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5800352102248851, "5": 0.411105769861181, "3": 0.00872710481888948, "2": 1.9748263392042607e-05, "1": 0}, "score": 4.402384302687846}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8004004292326711, "4": 0.1981901015616751, "3": 0.0011034043663014051, "2": 1.697121461542132e-06, "1": 0}, "score": 4.799536983870596}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9328597788977726, "4": 0.06609817117872914, "3": 0.0010328141684935906, "2": 2.744556671646125e-06, "1": 0}, "score": 4.931827524293208}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9336938670044626, "4": 0.06521563749016805, "3": 0.001084917317459416, "2": 2.132366845697863e-06, "1": 0}, "score": 4.932607898553254}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.836615360095286, "4": 0.16094894115162958, "3": 0.0024068082183168206, "2": 6.239122565333344e-06, "1": 0}, "score": 4.834214969778984}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6903825256537448, "4": 0.3057424799923219, "3": 0.003854665677929942, "2": 7.104387549928139e-06, "1": 0}, "score": 4.6865227299753265}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7958695249121303, "4": 0.20270349164382442, "3": 0.001407825448735319, "2": 3.2397399296768157e-06, "1": 0}, "score": 4.794467866525926}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8737224208958233, "4": 0.12107543474391663, "3": 0.005072264064562846, "2": 8.361513613630009e-05, "1": 0}, "score": 4.868523108919206}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9969852505113399, "4": 0.0027499157613752917, "3": 0.00021817730501248422, "1": 2.000404609742309e-05, "2": 0}, "score": 4.996733626387591}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7593816767985195, "4": 0.23565863098361797, "3": 0.004873097047349856, "2": 6.045562095693165e-05, "1": 1.804155228845059e-05}, "score": 4.754339652492836}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9700964707970733, "4": 0.02868758007155364, "3": 0.0011215136868740155, "2": 1.2791316700728352e-05, "1": 0}, "score": 4.969028489962673}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9962965821302932, "4": 0.0036319158048348046, "3": 5.988227538819158e-05, "2": 3.650395985756854e-07, "1": 0}, "score": 4.996247182288569}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5176340259660727, "4": 0.44368745260642733, "5": 0.02331983483668128, "2": 0.014731218935948788, "1": 0.0004291592052804146}, "score": 3.4748317480810584}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6312302411695514, "5": 0.29575576011965904, "3": 0.07133751020977455, "2": 0.0014155198927449182, "1": 0}, "score": 4.221645052525282}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7166800516371111, "4": 0.2734297078067886, "3": 0.009288293826687367, "2": 1.95524296594338e-05, "1": 0}, "score": 4.707764851165989}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5524708318585658, "4": 0.4299693723174608, "3": 0.01745262869729889, "2": 3.687130321966231e-05, "1": 0}, "score": 4.534982067559802}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.824179799169371, "5": 0.1276538468283237, "3": 0.04783304310309947, "2": 0.000300303178084206, "1": 0}, "score": 4.079222812333552}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6148998438293861, "5": 0.33408320508799716, "3": 0.04991398774373518, "2": 0.0009552577104626153, "1": 0}, "score": 4.282300399281216}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8037743889021296, "4": 0.19187103986379708, "3": 0.004306460250047428, "2": 2.6340760226808987e-05, "1": 0}, "score": 4.799432650959353}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6748168420779805, "4": 0.3163864720024549, "3": 0.00870025102751938, "2": 8.361881528323079e-05, "1": 1.1105800706226962e-05}, "score": 4.665917174919977}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7700792248589144, "4": 0.22766275267306757, "3": 0.002170002411803938, "2": 4.3736222589061245e-06, "1": 0}, "score": 4.767964712712214}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9003784266290342, "4": 0.09885171302262354, "3": 0.0007590039320617862, "2": 2.041087099771171e-06, "1": 0}, "score": 4.899623270998046}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7827545859700522, "5": 0.16435867443650964, "3": 0.05252116750881343, "2": 0.000327969808851858, "1": 2.7264842670123003e-05}, "score": 4.111100921280324}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5713665678986536, "4": 0.40545488877997576, "3": 0.022923288961104075, "2": 0.00020019112955136894, "1": 3.366112322606678e-05}, "score": 4.547953640671485}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5196205215841249, "5": 0.3871787137151929, "3": 0.0922588745135132, "2": 0.0007800431650532255, "1": 0.00013901523868712197}, "score": 4.292949395712672}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6247110850766374, "4": 0.36044784744644437, "3": 0.01471355648952825, "2": 8.668428047643425e-05, "1": 2.4022732221705037e-05}, "score": 4.609762338260391}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.864190801058495, "4": 0.13477012900204982, "3": 0.001013396924257093, "2": 1.8465694346056848e-06, "1": 0}, "score": 4.863194277847013}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9426738504114854, "4": 0.05570856353335156, "3": 0.0015848218110867665, "2": 1.1353516934088037e-05, "1": 1.0406889700002617e-05}, "score": 4.941045456008655}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4231078998822125, "5": 0.27896574011150405, "3": 0.23496559025638453, "2": 0.03809329487004456, "1": 0.0248619315205151}, "score": 3.893227173673341}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8736728385553496, "4": 0.11518604214463259, "3": 0.010939255908258134, "2": 0.00011717675929687843, "1": 7.035659733863854e-05}, "score": 4.862300516133166}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6714687511442736, "4": 0.2888645459148815, "3": 0.036902229858197876, "1": 0.0013808536280479479, "2": 0.0013699586802478044}, "score": 4.627692617808649}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7087249630973294, "4": 0.25103093510861857, "3": 0.03545953825480358, "2": 0.0027161267567377273, "1": 0.002053754700243909}, "score": 4.661681622092329}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4953111638846623, "2": 0.46851488790331225, "4": 0.0316495736897764, "1": 0.004339964980116325, "5": 0.00018221322330564188}, "score": 2.554818204511684}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8334921457925448, "3": 0.1523703208155059, "1": 0.012280060863062197, "4": 0.0018454668468023765, "5": 1.160404283862524e-05}, "score": 2.14381606353674}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8963747013094328, "3": 0.10229498803909105, "1": 0.0012505635365761326, "4": 7.900542792074477e-05, "5": 0}, "score": 2.1012025104189407}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.7630197983501895, "3": 0.2281155226628486, "1": 0.0067034296198045015, "4": 0.002152842967198618, "5": 8.240660990223446e-06}, "score": 2.2257425383747473}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.7966289634962046, "3": 0.18618298473020292, "1": 0.013854100848921455, "4": 0.003323970090745782, "5": 9.736177219001704e-06}, "score": 2.179006076389467}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"4": 0.628938777554862, "5": 0.3014620624757171, "3": 0.06778871793641016, "2": 0.0016306411466481864, "1": 0.00016356648732188933}, "score": 4.2299250954797945}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5116175529274556, "4": 0.4571856793767925, "3": 0.03090162832082558, "2": 0.00025304125988091607, "1": 3.3587351678688736e-05}, "score": 4.480113166161379}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.838732856709175, "4": 0.15717117200438385, "3": 0.0040324707562745385, "2": 1.970374182305695e-05, "1": 0}, "score": 4.83469753554055}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9082852479417045, "4": 0.08918729341925373, "3": 0.00249946692461191, "2": 9.634067917591066e-06, "1": 0}, "score": 4.905783140927976}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6464667453932534, "4": 0.33970244714497333, "3": 0.013685974906082766, "2": 0.00010251934966320349, "1": 0}, "score": 4.632602499227728}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5180343117586714, "3": 0.2926958101127023, "5": 0.162562115665846, "2": 0.023065709535805633, "1": 0.003615354733391178}, "score": 3.812883826617539}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7019862233545249, "3": 0.2063392747801207, "5": 0.08176078919439536, "2": 0.008984458748641323, "1": 0.000922814425012906}, "score": 3.854683217874927}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8710452166385473, "4": 0.12318848477333548, "3": 0.00567212416003402, "2": 6.490168315492507e-05, "1": 0}, "score": 4.8652686178997495}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6322207233502773, "4": 0.3360312894471601, "3": 0.030702143683581682, "2": 0.0008360787924321556, "1": 0.00020611588475309784}, "score": 4.599230260923993}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5433279944844253, "4": 0.4151356685528661, "3": 0.04052822232598417, "2": 0.0007462838008588512, "1": 0.00015234223835105469}, "score": 4.500905021229933}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9200209384621947, "4": 0.07892681881112484, "3": 0.0010280566566449548, "2": 1.2692504862737674e-06, "1": 0}, "score": 4.91901140412309}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.933068865531149, "4": 0.06667168026199227, "3": 0.00024425177498130696, "2": 4.3843950219501943e-07, "1": 0}, "score": 4.932837509283038}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8401532527799218, "4": 0.15580628596279167, "3": 0.003919670832525766, "2": 8.990761570487565e-06, "1": 0}, "score": 4.836309099499902}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9968295804280084, "4": 0.0031266141535907315, "3": 4.133330361580767e-05, "2": 1.4874007759340302e-07, "1": 0}, "score": 4.996790265561528}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9908640566633459, "4": 0.00893174495041923, "3": 0.00018656534591648117, "1": 1.0445638866610036e-05, "2": 3.859592307053648e-06}, "score": 4.990641731882828}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7257165263351457, "5": 0.2235346149917777, "3": 0.049561334283243295, "2": 0.0010516186819540918, "1": 0.00012635817815849365}, "score": 4.171492606140904}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5114812403605384, "4": 0.4719577547738281, "3": 0.016276970873519134, "2": 0.000232459393454237, "1": 3.282362590123956e-05}, "score": 4.494650154993989}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.598462417764509, "4": 0.3822051395452097, "3": 0.01912559095765994, "2": 0.00016809084174958954, "1": 0}, "score": 4.579023088574097}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6646230507625012, "5": 0.3018472150661763, "3": 0.03289092155062304, "2": 0.0005206570428741289, "1": 6.820995745727575e-05}, "score": 4.267723721184774}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.593408587227955, "5": 0.3884904854307783, "3": 0.01797662457077559, "2": 8.317639203341695e-05, "1": 0}, "score": 4.370362739754137}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.982865887484218, "4": 0.016563125664158455, "3": 0.0005597341606903159, "2": 5.024487998782032e-06, "1": 4.153268264703887e-06}, "score": 4.982285682721355}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9859422283827293, "4": 0.013178063340084154, "3": 0.0008479360820112005, "1": 1.6066487131921435e-05, "2": 1.4782744050023747e-05}, "score": 4.985017436486849}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9748017110007642, "4": 0.02472112840457984, "3": 0.00046848920414428497, "2": 3.0308422705265335e-06, "1": 0}, "score": 4.974332655882428}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9796099987343082, "4": 0.0199364712203827, "3": 0.0004461903068412464, "2": 1.918187170454845e-06, "1": 0}, "score": 4.979165280647924}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9809650793924035, "4": 0.018472884958007543, "3": 0.0005532130878564914, "2": 3.2522060736673564e-06, "1": 2.8708224537356427e-06}, "score": 4.980399396045761}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7628028416304728, "4": 0.23345605987224327, "3": 0.00371557252863055, "2": 1.515113668667476e-05, "1": 0}, "score": 4.759064841998657}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8964804528705794, "4": 0.10273255716171079, "3": 0.000760431593261244, "2": 9.416661789154573e-07, "1": 0}, "score": 4.8957410838829905}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6116453670680224, "5": 0.38078018980083084, "3": 0.007549637727386849, "2": 1.718066387221866e-05, "1": 0}, "score": 4.373199036291277}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9512353278488406, "4": 0.048572463660352304, "3": 0.00018659594514227937, "2": 2.879292634497455e-07, "1": 0}, "score": 4.951053220038745}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6336399424410873, "5": 0.3576335929779264, "3": 0.008699993503900338, "2": 1.446664359996154e-05, "1": 0}, "score": 4.348908854639965}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4351381117541349, "5": 0.36635315735571333, "3": 0.13691758548092497, "2": 0.033258729665789466, "1": 0.028293259016591868}, "score": 4.0780413913388776}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.572919305661756, "4": 0.2967202212940964, "3": 0.08458316732130154, "1": 0.02455255148498538, "2": 0.021173133261340602}, "score": 4.372351438507682}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5863253726885144, "4": 0.3580540952307455, "3": 0.046773381932085495, "1": 0.004667159203486837, "2": 0.0041530843662840305}, "score": 4.517258262063632}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6182049637233712, "4": 0.35623024555871496, "3": 0.02415352854578989, "2": 0.0009987300860062195, "1": 0.0004068931246511393}, "score": 4.590836627336589}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9534606202540942, "5": 0.03144165414659349, "2": 0.007396857730254465, "3": 0.004632102547646536, "4": 0.0030653957464522774}, "score": 1.1516243775609842}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6602190137453143, "3": 0.199872323257549, "5": 0.12338321473253556, "2": 0.015338887630213358, "1": 0.0011350506539656406}, "score": 3.889422268395873}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7771318436980109, "3": 0.12348045432674887, "5": 0.09681929268122606, "2": 0.0023301328403592227, "1": 0.0002326459006671829}, "score": 3.967980454684011}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6642955188538727, "3": 0.20285620514043082, "5": 0.12253313448256788, "2": 0.009324776328124871, "1": 0.000970244457671559}, "score": 3.8981145933033665}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9312214010889412, "4": 0.06741525172107549, "3": 0.001344393899278995, "2": 9.37731578073169e-06, "1": 0}, "score": 4.929867156942677}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6071784526156446, "5": 0.35304579485347753, "3": 0.039096333060801104, "2": 0.000531282321024909, "1": 8.033163937357909e-05}, "score": 4.31266710278477}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5564531270144523, "3": 0.22290168035811472, "5": 0.19107803006332322, "2": 0.023413680282248796, "1": 0.006152723805559001}, "score": 3.902890744068964}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5550656965938346, "5": 0.22508188717250302, "3": 0.20925825917941884, "2": 0.008559384462504118, "1": 0.002033016557502365}, "score": 3.9926057964110937}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6962333861001463, "5": 0.2405356422002688, "3": 0.062117073018145764, "2": 0.0010173297261077173, "1": 7.874324985967366e-05}, "score": 4.176150819992965}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8515658906650441, "4": 0.14187135254654226, "3": 0.006497125049506493, "2": 5.129486029439003e-05, "1": 1.3407557734017005e-05}, "score": 4.844926738429805}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5702091247005419, "3": 0.2437729791772402, "5": 0.16681808027462372, "2": 0.015581444933445423, "1": 0.0036164825384045712}, "score": 3.8810325389600115}]