[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6191561725358833, "2": 0.3437070786178184, "4": 0.03439600345451038, "1": 0.0016262394751677637, "5": 0.0009156018036292719}, "score": 2.6892058312551583}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7596488818661854, "5": 0.21256647840262222, "3": 0.02620492260962171, "2": 0.0014940963545606667, "1": 7.509571936148444e-05}, "score": 4.18315000358831}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7093131439998501, "4": 0.28432725439673634, "3": 0.006313931738744765, "2": 3.6003298453392955e-05, "1": 3.030899857076744e-06}, "score": 4.702922777325652}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9283308131799146, "4": 0.07015536474634675, "3": 0.0014605064789916969, "2": 3.269265902212566e-05, "1": 0}, "score": 4.926824035215386}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9897626183991249, "5": 0.010222010412503002, "3": 1.263394902807525e-05, "2": 8.589629907497703e-07, "1": 0}, "score": 4.0102076777103335}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3616386030282332, "2": 0.27042015496463784, "3": 0.18588843445273923, "4": 0.14428049386360936, "1": 0.03776098697263319}, "score": 3.5216214792696467}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6521735966263418, "3": 0.277943256342909, "5": 0.06036899703164402, "2": 0.009314244350611237, "1": 0.00018832657520444283}, "score": 3.7632295306792827}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4218951101448301, "3": 0.3951735908948783, "2": 0.11734569998578087, "5": 0.06393813523949991, "1": 0.0015861540965359585}, "score": 3.4292796914276633}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5294116412047185, "5": 0.40991928685204315, "3": 0.0550141749825554, "2": 0.005391108265912575, "1": 0.0002560970714514716}, "score": 4.343357245097901}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7707681762072042, "4": 0.20731931287230076, "3": 0.020407853025023973, "2": 0.0014371126248123554, "1": 6.462217111131094e-05}, "score": 4.74729441583519}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6302089171781657, "4": 0.2040894705824626, "5": 0.11436793817784241, "2": 0.05063888092640956, "1": 0.0006931403874485139}, "score": 3.3808008146045}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5758160079254941, "4": 0.3473189350454688, "3": 0.07467288037124437, "2": 0.0020842720945709586, "1": 0.00010211580965212678}, "score": 4.496671111042818}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9833144095765329, "4": 0.016248754813563644, "3": 0.00042376957739272624, "2": 7.379800147523056e-06, "1": 0}, "score": 4.982881469291265}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9074984779814179, "4": 0.08529270925012289, "3": 0.006555610703825916, "2": 0.0005331216091856181, "1": 0.0001132282347171084}, "score": 4.899543103222969}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9372610815154022, "4": 0.05565565996295927, "3": 0.00611384504577313, "2": 0.0008193529619326953, "1": 0.000146604364128775}, "score": 4.92907192846514}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6212222938439993, "5": 0.2762857839164121, "3": 0.09523335794291735, "2": 0.0066786594013156534, "1": 0.000554861846738641}, "score": 4.166034679645202}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9448121446307746, "3": 0.05356111181854451, "1": 0.001535299658087839, "4": 8.853044976375916e-05, "5": 2.3452583302029017e-06}, "score": 2.052209938499853}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6701787574622738, "4": 0.30143089290995145, "2": 0.017453827734076836, "5": 0.010898581890500017, "1": 3.268484641026366e-05}, "score": 3.305710465820483}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6953412338178021, "2": 0.23440893579818406, "4": 0.06310643712366469, "5": 0.003910286632996498, "1": 0.0032301315985254157}, "score": 2.8300573058100085}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.6072989409174617, "2": 0.27068291459456223, "4": 0.10092039916050993, "5": 0.01319869919604408, "1": 0.00789288545963469}, "score": 2.8408481315563403}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3743041263328019, "4": 0.305039317758313, "5": 0.21330705042910075, "2": 0.10563897440465911, "1": 0.0016881172910553405}, "score": 3.6226521656209365}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6310251246744072, "3": 0.2245187851049422, "5": 0.1310021164244053, "2": 0.013240777587819205, "1": 0.0002072623864485312}, "score": 3.87937927324256}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8936973104986115, "4": 0.10477111136595518, "3": 0.0014845078140729676, "2": 1.9617176960204044e-05, "1": 0}, "score": 4.892198061972846}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5740950810223596, "4": 0.42014192841114684, "3": 0.005669473628679047, "2": 5.592131190075373e-05, "1": 0}, "score": 4.568335131684883}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5147440459593992, "4": 0.42512599294639686, "3": 0.054630360372054126, "2": 0.005099911970944195, "1": 0.0003382852782410176}, "score": 4.448926571461327}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"2": 0.825985070565839, "3": 0.10976236151230463, "4": 0.03231247824443695, "1": 0.028014462060151162, "5": 0.0037611726319585308}, "score": 2.157682305478134}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6870410747318245, "4": 0.30771243030154877, "3": 0.004869847288387187, "2": 0.0003512558439059702, "1": 0}, "score": 4.681486019935744}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.989780138342293, "4": 0.01015512779081416, "3": 4.7428701293067584e-05, "2": 1.1369731025318648e-06, "1": 0}, "score": 4.989746438105729}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984204435145674, "4": 0.0015736092699309026, "3": 3.632537928953933e-06, "2": 2.0114958533988346e-07, "1": 0}, "score": 4.998418518862952}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9868325228261496, "4": 0.013116477693415276, "3": 3.167638840133303e-05, "2": 1.4954266607980008e-06, "1": 0}, "score": 4.986815448200022}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6451872333804036, "3": 0.3207093877585669, "5": 0.021035832201862253, "2": 0.013029298846490801, "1": 3.605399074798339e-05}, "score": 3.6741589699408728}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4119862516380308, "3": 0.40385129922543384, "2": 0.17014737597292695, "5": 0.012624341040434249, "1": 0.0013800083901674782}, "score": 3.2643303755740107}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7749524394217324, "4": 0.22399530212573387, "3": 0.0010014720614023938, "2": 3.756750913065163e-05, "1": 0}, "score": 4.773886062250607}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8720588664106615, "4": 0.12651909924972046, "3": 0.0013453133756751205, "2": 6.082303351663845e-05, "1": 0}, "score": 4.87060574779756}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6188277168479783, "3": 0.2315457501831229, "5": 0.10909777287094573, "2": 0.03823947193979738, "1": 0.002264290758472683}, "score": 3.794275063944359}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"2": 0.31249203441579787, "4": 0.2834244447932105, "3": 0.26472286305990606, "5": 0.12121538190404935, "1": 0.018136797380858626}, "score": 3.177091080880992}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4139478952340725, "3": 0.37175048091167723, "2": 0.13520911486570417, "5": 0.07422709750435182, "1": 0.004856124437686674}, "score": 3.417484603700629}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7208206099041616, "5": 0.26358918638866613, "3": 0.015273035363050878, "2": 0.0002888485660761913, "1": 0}, "score": 4.247745469990185}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6608625323317334, "5": 0.3031032719574211, "3": 0.03394917587298671, "2": 0.0019792929381425195, "1": 8.593159372748057e-05}, "score": 4.264942960053931}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.49465829891797986, "4": 0.4919428784211822, "3": 0.013180866612274012, "2": 0.00020191918800285181, "1": 1.185093251772974e-05}, "score": 4.481040054731202}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"2": 0.49793168006161515, "1": 0.2764644327802281, "3": 0.16484845197747422, "4": 0.038033314726754856, "5": 0.022614336848646607}, "score": 2.0322971402989176}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9711261757529679, "4": 0.027040533445173216, "3": 0.0016214621095824156, "2": 0.00016817423548703454, "1": 2.4030276544019257e-05}, "score": 4.969115292435956}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6884582649550298, "4": 0.30689675220387863, "3": 0.004495757970607517, "2": 9.684585182041421e-05, "1": 0}, "score": 4.683804632296379}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991147809877264, "4": 0.0008791535397935875, "3": 3.3336591947212692e-06, "2": 7.94275938079642e-08, "1": 0}, "score": 4.9991139385088585}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9981784449488367, "4": 0.0018087751056578402, "3": 1.0374973977950564e-05, "1": 4.679202320002404e-07, "2": 0}, "score": 4.998168599717943}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5657116403210622, "5": 0.38725257897166543, "3": 0.041091869476733996, "2": 0.005590031258333966, "1": 0.0002921348637978971}, "score": 4.334124872963371}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4992027964897509, "3": 0.4224865360626581, "5": 0.056709655031635345, "2": 0.021502686460568046, "1": 8.325003572289235e-05}, "score": 3.5909618293140713}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5278213314220865, "5": 0.43868901983174624, "3": 0.0316001566854894, "2": 0.001810622627070049, "1": 5.2344117271463386e-05}, "score": 4.403321283764939}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8555904445190963, "4": 0.13837360075261754, "3": 0.005777010180140208, "2": 0.00020065952332607562, "1": 3.280610276410232e-05}, "score": 4.8493353371328665}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8784097575206776, "4": 0.1195323778449676, "3": 0.001998077121802433, "2": 3.8809131154089685e-05, "1": 0}, "score": 4.876352446592432}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3238289288519593, "3": 0.3231052362500389, "4": 0.20908765772396265, "5": 0.07589571135983082, "1": 0.06791397827457288}, "score": 2.9012055494086093}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6786996438674878, "5": 0.19944734745843598, "3": 0.09930453890128041, "2": 0.020701844011443704, "1": 0.001823688829035525}, "score": 4.053269275880937}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9001523429841359, "4": 0.0983312694671843, "3": 0.0014944261380163838, "2": 1.3038239737932676e-05, "1": 0}, "score": 4.898639859083707}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8976453427034377, "4": 0.09890663051321175, "3": 0.003313580341539656, "2": 0.00010503887901592241, "1": 1.64477642803272e-05}, "score": 4.894083928458594}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7862460066208278, "4": 0.19455758361956088, "3": 0.01831610228025994, "2": 0.0007816811008627519, "1": 7.8540668285127e-05}, "score": 4.766146308726716}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5080206614932199, "4": 0.38026498512746376, "2": 0.09159300269614289, "5": 0.01952170608345822, "1": 0}, "score": 3.327912025273374}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5503982345194285, "2": 0.40904854829330095, "4": 0.03925302765585074, "5": 0.0011882020461328187, "1": 0.00010035416287748859}, "score": 2.632375898439362}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6301854234276596, "3": 0.32284666171909315, "5": 0.036089222641589355, "2": 0.01076734862116934, "1": 0}, "score": 3.691673533504335}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6441137422966053, "4": 0.3499248366464496, "3": 0.005719438744474706, "2": 0.00021056629790742513, "1": 0}, "score": 4.637993214160423}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5421365890359922, "5": 0.21564705766738143, "3": 0.19042840153946186, "2": 0.049047866026637785, "1": 0.0018543983039271985}, "score": 3.9214901940148366}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8047616519012435, "1": 0.10622747432575162, "3": 0.08614040480349186, "4": 0.002016136949057735, "5": 0.0006314539755409492}, "score": 1.9858364095491299}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.995116362923082, "4": 0.004699444353098423, "3": 0.00015679442586660194, "2": 1.4628147124441068e-05, "1": 1.0021828439127243e-05}, "score": 4.994902981031787}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8737381567783248, "4": 0.12405273767034729, "3": 0.0021367591793228172, "2": 3.09997939585377e-05, "1": 0}, "score": 4.8715754346728195}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9897942695342034, "4": 0.009762524053036584, "3": 0.0003422336044943101, "2": 3.924918022269342e-05, "1": 0}, "score": 4.989434609063046}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7262166083852971, "4": 0.25946901142004336, "3": 0.012865602523850012, "2": 0.001208447259577222, "1": 0.00018686614491729203}, "score": 4.710411494536878}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6189788715987752, "2": 0.3060960920556651, "3": 0.0498010604998778, "5": 0.014124299444911781, "4": 0.01073508102434347}, "score": 1.494531504657728}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7766274390709685, "4": 0.2195581195426193, "3": 0.0033813372893447603, "2": 0.00034746782054344614, "1": 4.9040209221579363e-05}, "score": 4.772432313497804}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8014002811152158, "4": 0.19212303593986804, "3": 0.005417764513477317, "2": 0.0005812221594094717, "1": 0}, "score": 4.7951999363280216}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9249909234540155, "4": 0.07409237155168887, "3": 0.0008074721440459538, "2": 4.718710036863277e-05, "1": 0}, "score": 4.924146416466641}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9870301469429179, "4": 0.01281779293841996, "3": 0.00013960912562024276, "2": 5.966512333583869e-06, "1": 0}, "score": 4.986885004229402}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9214784849514558, "3": 0.05405302877103615, "1": 0.023759044498640698, "4": 0.0006370747897139342, "5": 7.202235507403503e-05}, "score": 2.0317842118709675}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6151189593766714, "3": 0.318085838575455, "4": 0.047570602646167456, "1": 0.010156900015235741, "5": 0.009059131721489914}, "score": 2.43025122526538}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.9189293432200495, "3": 0.0791311402209536, "1": 0.001770830559147495, "4": 0.00016176207097673325, "5": 6.215657786912112e-06}, "score": 2.07770253581158}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8406114208147718, "4": 0.15374012530755243, "3": 0.005485377300099559, "2": 0.0001489633880496442, "1": 1.1716997413803616e-05}, "score": 4.834794966075446}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.44947108687410003, "4": 0.43530177185912333, "3": 0.09887609286096545, "2": 0.015663492388015628, "1": 0.0006651187246069825}, "score": 4.317279771962549}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7977706809984879, "3": 0.1207487667200698, "1": 0.04275837484409349, "4": 0.034912016385304355, "5": 0.0037911290571168363}, "score": 2.159190841537224}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5664736348617652, "4": 0.4276709446525314, "3": 0.005781055502964112, "2": 6.505834989888051e-05, "1": 0}, "score": 4.56056767965658}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9926222194297517, "4": 0.007340812849856118, "3": 3.611284278768539e-05, "2": 3.098737129650767e-07, "1": 0}, "score": 4.992586027802786}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9754443131419716, "4": 0.024177382264883633, "3": 0.00036626648075388, "2": 1.0075135510986456e-05, "1": 1.1353699647638654e-06}, "score": 4.975055297242808}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.85575181553703, "4": 0.14262366942904192, "3": 0.0015918204190927447, "2": 2.765195851874761e-05, "1": 2.2964295747290295e-06}, "score": 4.85410014746484}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9788124840996653, "2": 0.021167688231726607, "3": 1.221047949418144e-05, "5": 2.8051910606208504e-07, "4": 0}, "score": 1.0211933867560243}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.629174239693856, "1": 0.1794740948236361, "3": 0.09383071730308294, "4": 0.05213568666108207, "5": 0.045366392561769296}, "score": 2.154730093082326}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9410383911334725, "4": 0.05543495098205653, "3": 0.003129054176899298, "2": 0.00024336991212160918, "1": 0.00013297625227613687}, "score": 4.93704358762002}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8661583282950519, "4": 0.1296408946109743, "3": 0.003584633649395966, "2": 0.000535695851061008, "1": 6.94727478192786e-05}, "score": 4.861303337371302}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9517330749133052, "4": 0.044139795992168995, "3": 0.003349761934495677, "2": 0.0005290579424831099, "1": 0.0002315726293381448}, "score": 4.946646322835513}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9028188940310962, "2": 0.09631646487252557, "3": 0.0008276377494289811, "4": 1.971834770655935e-05, "5": 1.553138100148011e-05}, "score": 1.0980931929565219}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5318148907005873, "4": 0.4588957816184697, "3": 0.00908119942344193, "2": 0.00017364805144507074, "1": 0}, "score": 4.52240440778588}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9947407482464034, "4": 0.005208979061003285, "3": 4.317849446390236e-05, "1": 3.4648957928091507e-06, "2": 2.0688265406581837e-06}, "score": 4.994684589592707}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9749215721891705, "4": 0.024749457732634657, "3": 0.00030006153130172767, "2": 1.1484652260404082e-05, "1": 0}, "score": 4.974615522951527}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9822422535587156, "4": 0.0175421363624416, "3": 0.0002066985719717961, "2": 5.1275556182935075e-06, "1": 2.6198670126763574e-06}, "score": 4.982018583426825}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9431939293570021, "1": 0.03953126109327054, "3": 0.017040910941527838, "4": 0.0002016248027138449, "5": 3.1221112790450975e-05}, "score": 1.9780065396397013}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.43488939699698337, "2": 0.23285677825824647, "4": 0.2208793840461082, "5": 0.10583990042317508, "1": 0.005519807458544165}, "score": 3.188665571292449}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6996679875193665, "4": 0.29179578144680335, "3": 0.008454808045199142, "2": 7.790292949140342e-05, "1": 2.31480756303508e-06}, "score": 4.691051262083119}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6434953487640322, "4": 0.33298501167488614, "3": 0.02111020724046072, "2": 0.002211008793400682, "1": 0.00013070783404434008}, "score": 4.617612822515028}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4019504848356652, "3": 0.2655205872168267, "5": 0.2561960262457142, "2": 0.07196877029239641, "1": 0.004339017669163917}, "score": 3.833716669440234}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9986864583520334, "2": 0.0013028807559904148, "3": 4.3770131299495894e-06, "4": 0, "5": 0}, "score": 1.0013116430244562}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7147352246832718, "3": 0.25043571954240373, "1": 0.02102505409998331, "4": 0.011153867279508426, "5": 0.002638132496051602}, "score": 2.2596359136135473}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5332035141608679, "5": 0.42276117816653885, "3": 0.04156204117605962, "2": 0.002329893780993757, "1": 8.338792860690103e-05}, "score": 4.376311758623332}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6416415272548384, "2": 0.16995875313306372, "4": 0.1456176395211993, "5": 0.030630072229835353, "1": 0.012139378367194531}, "score": 3.0126404337556973}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.477430967592301, "3": 0.4764039739076467, "5": 0.03713612735627565, "2": 0.00900430934617652, "1": 2.094656262996286e-05}, "score": 3.542659014232802}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6790948299379301, "1": 0.31164966208658923, "3": 0.008934634837324698, "4": 0.00024896505816529194, "5": 6.493329797220466e-05}, "score": 1.6979755962066017}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8515280394024546, "4": 0.14008635851622467, "3": 0.006013395589790429, "2": 0.0018138571119305094, "1": 0.0005045293214691196}, "score": 4.840418573000849}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9759747654256143, "4": 0.023833533961992896, "3": 0.00016500611898396703, "2": 6.8511708040231495e-06, "1": 0}, "score": 4.975815420385211}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998772798807299, "4": 0.00012212786357188398, "3": 3.4351673754282415e-07, "1": 2.0410384938774218e-08, "2": 0}, "score": 4.999877103433352}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9918298942220188, "4": 0.00812509791306644, "3": 2.9801897261090278e-05, "2": 1.0882441849669012e-06, "1": 0}, "score": 4.991811917962777}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5170407435182717, "3": 0.2501490596999052, "5": 0.1468652763279313, "2": 0.08333630420195512, "1": 0.0025929527363303573}, "score": 3.72226039963656}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7629587439487447, "4": 0.2343237904993886, "3": 0.0026279557931013003, "2": 6.78611399631267e-05, "1": 0}, "score": 4.7602115234051965}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.942506493526892, "4": 0.0569967973253906, "3": 0.00045359220066486494, "2": 5.542904037790651e-06, "1": 0}, "score": 4.942077213167883}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9826608457016826, "4": 0.017217000192620385, "3": 0.00010815739831491709, "2": 4.504295774450708e-06, "1": 0}, "score": 4.9825530065093835}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.828593610970791, "4": 0.1698464475183375, "3": 0.001450471359294049, "2": 6.0190020007435844e-05, "1": 0}, "score": 4.827063517370434}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8670724254436694, "2": 0.12918078779084768, "3": 0.0034449875102320346, "4": 0.0001857910319448455, "5": 8.597474221689655e-05}, "score": 1.1369761487465868}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5622407162848857, "4": 0.23445772137368673, "3": 0.14529710978012286, "1": 0.03835719326185749, "5": 0.019564386124881865}, "score": 2.6346011090487744}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8429399813630368, "5": 0.10935424634626728, "3": 0.04612201011857235, "2": 0.0015408972536201143, "1": 2.192532930952769e-05}, "score": 4.060085923907089}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7550973482239053, "4": 0.23983981883161185, "3": 0.004880340436365488, "2": 0.00015905396671974308, "1": 1.8641281519946216e-05}, "score": 4.74984657321842}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6181201270957724, "4": 0.37570053589969393, "3": 0.005875490106784313, "2": 0.0002883146902163868, "1": 1.2228906787946108e-05}, "score": 4.611633341297064}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5851142802348299, "3": 0.3446841805148435, "4": 0.05826239030832024, "1": 0.006680396078518248, "5": 0.005141260480035655}, "score": 2.4700075688025716}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6530124395763107, "4": 0.15729436387176132, "2": 0.13818255579006702, "5": 0.04503869364053308, "1": 0.003380177689537251}, "score": 3.102746508497883}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6993469415790726, "5": 0.18358116375240768, "3": 0.11232863085489235, "2": 0.0037657810087492346, "1": 0}, "score": 4.0637833179765765}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5315708968359188, "5": 0.42721802451904073, "3": 0.03948211083160417, "2": 0.0016370665954855313, "1": 7.650824845523592e-05}, "score": 4.384238170317533}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6266988730386829, "3": 0.21204215070347834, "5": 0.14164901591916823, "2": 0.01933716088284014, "1": 0.00021151703901590258}, "score": 3.8902912691167875}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8136287484518988, "1": 0.14109141011088566, "3": 0.0399787186579308, "4": 0.004241666688781274, "5": 0.0010196360796557188}, "score": 1.9104259833252593}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3215476611828325, "3": 0.319274258835815, "2": 0.2876518742393968, "5": 0.06517788856542954, "1": 0.006290539757174448}, "score": 3.1516792481954763}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.528859276749253, "2": 0.45154095567291835, "4": 0.018370367031767827, "1": 0.0007908138127615371, "5": 0.00043785489168579145}, "score": 2.5661231759875824}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9423063056754286, "4": 0.05605127960606172, "3": 0.001464204774400469, "2": 0.00013219096186724185, "1": 3.749387393748298e-05}, "score": 4.940473254991838}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6860177547715457, "3": 0.1549837509715202, "1": 0.11789575230915544, "4": 0.033680171418434046, "5": 0.0071226815661797165}, "score": 2.125854128461867}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"4": 0.46110670433644557, "3": 0.2226549088664051, "2": 0.18485835422564423, "5": 0.11459565384320683, "1": 0.016362137537760568}, "score": 3.472915066942583}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7210913360783985, "4": 0.2528007120651479, "3": 0.025147326255410704, "2": 0.0009094559448925684, "1": 4.479535979106535e-05}, "score": 4.693995135584495}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.57045870281722, "5": 0.39776229534426116, "3": 0.030452079343951742, "2": 0.0011585867912263029, "1": 0}, "score": 4.365054494122883}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962035863692463, "4": 0.0037475705585474726, "3": 4.573722683903742e-05, "2": 1.3081835317223837e-06, "1": 0}, "score": 4.9961570235288075}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4493410062948244, "4": 0.4344012338551838, "3": 0.08473987575292384, "2": 0.028156594188989546, "1": 0.003288964188823649}, "score": 4.29844263467566}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9527690754160926, "3": 0.039606778544673156, "1": 0.00756240286503922, "4": 5.742567815817404e-05, "5": 3.3267889449018794e-06}, "score": 2.032169239273079}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9808256166729505, "1": 0.014484234455546077, "3": 0.0046704399688210305, "4": 1.151407912114834e-05, "5": 0}, "score": 1.9902091534372572}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.49971838461698803, "5": 0.45773545999787557, "3": 0.04171941796206392, "2": 0.0007766842195880962, "1": 2.5909729588852588e-05}, "score": 4.414394949341511}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.464897233986003, "3": 0.38561703473662245, "5": 0.10213470497113022, "2": 0.04648615744787919, "1": 0.0008523400423662183}, "score": 3.6209835865847464}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9244935545517265, "1": 0.06539141488547857, "3": 0.009986237339120938, "4": 0.0001152091944446241, "5": 1.3192975884044386e-05}, "score": 1.9448647982093785}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6468699172180297, "3": 0.15831228647144874, "5": 0.14570343357474574, "2": 0.04470712473585457, "1": 0.003527125661235938}, "score": 3.887296328756203}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.522449683135225, "4": 0.2975227756857184, "2": 0.17106261840629422, "5": 0.007498354368865577, "1": 0.001444518111338298}, "score": 3.1385708853230403}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9426227899799379, "4": 0.05701176094857815, "3": 0.00033803132136979994, "2": 3.985323777355133e-06, "1": 0}, "score": 4.942298868359833}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7216267287276708, "4": 0.27484007388229587, "3": 0.0034959909844878385, "2": 3.2338276447317025e-05, "1": 3.096816220099108e-06}, "score": 4.718058042647087}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8960874278876012, "4": 0.101029937012108, "3": 0.002733790968211474, "2": 0.00012687236206376703, "1": 1.4738904434250009e-05}, "score": 4.893062134880337}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.34049327634655496, "2": 0.2568590212618085, "4": 0.17095819945384574, "3": 0.1286994291369793, "1": 0.10280325120020913}, "score": 3.389552005603486}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4874759125104185, "3": 0.2531674883493839, "4": 0.21360072023822063, "5": 0.0371332494179271, "1": 0.00839529625178696}, "score": 2.7835515081248063}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9929255915752666, "4": 0.00705040370977215, "3": 2.2642406864735328e-05, "2": 5.09375179784592e-07, "1": 0}, "score": 4.992902777297504}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8660555040820828, "4": 0.13253327937476042, "3": 0.0013401048792300193, "2": 6.336461343857667e-05, "1": 0}, "score": 4.864595368039943}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8565420990527862, "4": 0.1408249851009072, "3": 0.0025294636367569363, "2": 9.096506738830756e-05, "1": 1.0736686886934908e-05}, "score": 4.853799989759287}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"4": 0.513649938012652, "5": 0.45926806030941725, "3": 0.026543449099172625, "2": 0.000508355933111055, "1": 2.421076957584758e-05}, "score": 4.431637850765977}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7113008089211694, "5": 0.18928041239463925, "3": 0.09760823637846842, "2": 0.0017903192913151715, "1": 1.6365976201547078e-05}, "score": 4.0880427790892995}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9616687089680737, "4": 0.03805487812003035, "3": 0.00026663869985714135, "2": 1.3449550036572673e-06, "1": 0}, "score": 4.961407484309009}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.648436356237029, "4": 0.3449111263221302, "3": 0.006388600810896702, "2": 0.00022344930341466237, "1": 3.605128680007658e-05}, "score": 4.641495535828675}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9954204263726975, "4": 0.004553955878058783, "3": 2.396694424793979e-05, "1": 3.2707347405132806e-07, "2": 0}, "score": 4.995396795846143}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6445986009621937, "2": 0.17859105424644314, "4": 0.17221151832462955, "5": 0.004077154338347482, "1": 0.0004912790311688565}, "score": 3.0007922387711337}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5672094177332498, "3": 0.35684859171747074, "2": 0.06087692962072695, "5": 0.014741829232831188, "1": 0.00031102274917114053}, "score": 3.5352006353157925}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6961057016444626, "4": 0.17802172243218226, "2": 0.12360828567498408, "5": 0.0021197714557520827, "1": 0.00014378110774412831}, "score": 3.0583654605085315}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6799056367001322, "4": 0.31892679030894105, "3": 0.0011592268554485618, "2": 7.16598523147334e-06, "1": 0}, "score": 4.678732878880996}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6902444422480106, "5": 0.29733569270357807, "3": 0.012082912675712912, "2": 0.00031860387435513743, "1": 1.7723661556840867e-05}, "score": 4.284562579099652}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6086141084361524, "2": 0.25461125175048, "4": 0.12666661789111935, "5": 0.0076440661407919655, "1": 0.0023707917687166304}, "score": 2.882590976589037}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4383973666918171, "4": 0.35233544092012675, "2": 0.1645951099283076, "5": 0.03928350375533512, "1": 0.004785293109736485}, "score": 3.256891731363939}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5106926691219011, "3": 0.39146606764091524, "5": 0.0625311341420904, "2": 0.03481676692654413, "1": 0.00024497632126211304}, "score": 3.6005973977305277}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7181061569194721, "4": 0.2729395054801599, "3": 0.008566906328936074, "2": 0.00036461702565691645, "1": 1.6473376923015772e-05}, "score": 4.708765090594939}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.689648990670797, "4": 0.29643337223862565, "3": 0.012408142110976622, "2": 0.001317646089269347, "1": 0.00015197097641323767}, "score": 4.674176528205599}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4116891931017647, "1": 0.2601190417147913, "4": 0.14144585292142256, "5": 0.10463418126462046, "3": 0.08156895033704692}, "score": 2.418471296385554}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9612511661529523, "4": 0.036954764329303544, "3": 0.0016864576752207271, "2": 7.474434505450075e-05, "1": 2.1163384833310042e-05}, "score": 4.959362958125244}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9353937456468638, "4": 0.06284810472057582, "3": 0.0015583428468464936, "2": 0.00010952288884539586, "1": 0}, "score": 4.933700655155983}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9704536795025053, "4": 0.029133732025400493, "3": 0.00038301006107627526, "2": 1.3149208385155698e-05, "1": 0}, "score": 4.970060308342029}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9171592662166623, "4": 0.06994191269959621, "3": 0.009804099151454094, "2": 0.0020857217928875282, "1": 0.0009463548060311325}, "score": 4.90040106498622}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6349861191085159, "5": 0.2640989593632875, "3": 0.08196648785068499, "2": 0.01810769487205856, "1": 0.0007350309138324006}, "score": 4.143727182124379}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9941625000017844, "4": 0.00574279071223872, "3": 7.784896146334743e-05, "2": 2.4316366714108185e-06, "1": 0}, "score": 4.994094131240883}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9347044929207755, "4": 0.06441997649179888, "3": 0.0006651732665785905, "2": 5.551593285181088e-05, "1": 0}, "score": 4.934072920936059}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9244009434264003, "4": 0.07248094349623337, "3": 0.002846840204328367, "2": 0.00015544446941426681, "1": 0}, "score": 4.921349932775135}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.883952792429072, "4": 0.1120051529794862, "3": 0.0036243631096541076, "2": 0.00031363646423124123, "1": 0}, "score": 4.879792703236137}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9954706346543548, "2": 0.004486609432570766, "3": 2.4804834109955085e-05, "5": 5.774554733195394e-07, "4": 0}, "score": 1.0045386077747467}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8463984492934462, "4": 0.14447809133261638, "3": 0.008825583141402164, "2": 0.00011720863571040277, "1": 0}, "score": 4.837489756142231}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9677032893100543, "4": 0.031238945793080494, "3": 0.0008760126732080964, "2": 8.542028919374335e-06, "1": 0}, "score": 4.966977682971781}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9628407398888053, "4": 0.0345063401280935, "3": 0.0022284402002921712, "2": 5.881721345900313e-05, "1": 0}, "score": 4.96084601068261}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8866088187625303, "4": 0.1058527819228799, "3": 0.005514206593492385, "2": 0.0002557850793192111, "1": 0}, "score": 4.882143030486653}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"5": 0.850919601665918, "4": 0.14296413276613767, "3": 0.005717703729974642, "2": 0.0003403740152864574, "1": 0}, "score": 4.844570293611858}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9931650678317181, "4": 0.006746179057019996, "3": 8.098739764710637e-05, "2": 4.143933916188311e-06, "1": 0}, "score": 4.993079389281009}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9883302716972815, "4": 0.011427403412417022, "3": 0.00022361605878702998, "2": 9.439382434698263e-06, "1": 0}, "score": 4.988096935987859}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9888334440347627, "4": 0.0110120703856449, "3": 0.00014006653475495125, "2": 6.757240238555474e-06, "1": 0}, "score": 4.988687438149491}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999155826714922, "4": 0.0008346973115254295, "3": 6.017491980418011e-06, "1": 4.86025862228414e-07, "2": 0}, "score": 4.999151321078405}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.49226725930768006, "4": 0.29598337256582097, "1": 0.09059444330395736, "3": 0.06195929139438977, "2": 0.058471419481407945}, "score": 4.041611934982267}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6192672467320597, "4": 0.3087624092329529, "3": 0.05522959102717734, "2": 0.01224003674328614, "1": 0.004210741156953329}, "score": 4.527078198304701}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.552454224834965, "5": 0.31890095828513715, "3": 0.11606980518846184, "2": 0.01161636499090502, "1": 0.0008809827607854204}, "score": 4.176969218959267}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9925486901881713, "4": 0.007235393731445142, "3": 0.0001597598192886508, "2": 1.97941325507624e-05, "1": 0}, "score": 4.992385427350257}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7507630422313973, "4": 0.2153357157660123, "3": 0.022680766599735756, "2": 0.007419734530526171, "1": 0.003679920979477189}, "score": 4.702287893980279}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8976236414919577, "2": 0.08733014257127514, "3": 0.012403539544082395, "4": 0.001190570113035002, "5": 0.0011168444785135403}, "score": 1.1202166139511187}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7120749971795208, "3": 0.13785837347178098, "5": 0.11637438826302623, "2": 0.03264066419440437, "1": 0.0009762664565998344}, "score": 3.9102991316212488}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.7585388211702369, "3": 0.22424761803884524, "4": 0.011285918283281378, "1": 0.005610940087258708, "5": 0.00029957492642309887}, "score": 2.2421113860587196}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9224242779126666, "4": 0.07634235372559464, "3": 0.0010899210680458348, "2": 6.112314244982016e-05, "1": 0}, "score": 4.921287954808652}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7171249613183516, "4": 0.263210864996802, "3": 0.018791816433603444, "2": 0.0006957287504206776, "1": 0.0001084807304820665}, "score": 4.696663721271742}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.963576891454526, "4": 0.0361005672669801, "3": 0.00028759796728414254, "2": 3.0722388347931304e-06, "1": 0}, "score": 4.963313850855033}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8939085304285808, "4": 0.10469698061129924, "3": 0.0013033343677281177, "2": 8.372558099356919e-05, "1": 3.819503949231344e-06}, "score": 4.892429507617973}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9866036427139785, "4": 0.013356042163632684, "3": 3.5366341330636546e-05, "2": 7.738900714452002e-07, "1": 0}, "score": 4.9865708474182435}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9920430206965122, "4": 0.007857026908608952, "3": 8.381303614377152e-05, "2": 5.546746601583412e-06, "1": 0}, "score": 4.991958621600096}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9860631083657099, "4": 0.013742862232742221, "3": 0.00017621301187466023, "2": 1.2224382929400007e-05, "1": 0}, "score": 4.985867959568255}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"4": 0.516989848532572, "3": 0.4430820551575313, "5": 0.025178092696453953, "2": 0.014694239981194505, "1": 5.273305866187367e-05}, "score": 3.552548002364343}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5033244434586167, "4": 0.39227368766069887, "2": 0.06996953121826686, "5": 0.034138561425874674, "1": 0.00028606457097138654}, "score": 3.3900121577955686}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9722878853793862, "4": 0.02729609028638793, "3": 0.0004121076320058676, "2": 2.3002287119378913e-06, "1": 0}, "score": 4.971872748296508}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9905583152680939, "4": 0.009277953356387935, "3": 0.00015657287522164644, "2": 3.493868440282792e-06, "1": 0}, "score": 4.990398384101461}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9754875282331829, "4": 0.024210617557335137, "3": 0.00028872150066355876, "2": 9.032169181032432e-06, "1": 3.5940207360126658e-06}, "score": 4.975170454274217}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5076677402584666, "1": 0.3530638712609261, "3": 0.13890542126470662, "4": 0.00023337265601716613, "5": 0.00012927482414500885}, "score": 1.7866960515873545}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9475822428033366, "4": 0.04664718950094654, "3": 0.0052411517771662666, "2": 0.0002672569507441871, "1": 0.00025814502979260555}, "score": 4.941035919295154}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9935674922279767, "4": 0.0062354882186790835, "3": 0.00019477159375537532, "2": 1.2964821498689933e-06, "1": 6.802088184238924e-07}, "score": 4.99336835651313}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9831648185187007, "4": 0.015710069543840403, "3": 0.0011190255690530996, "2": 4.9330652922027095e-06, "1": 1.1279079644689995e-06}, "score": 4.9820325680340325}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8060074204534181, "4": 0.19094611713053994, "3": 0.0030263548605076393, "2": 1.6190806124616298e-05, "1": 3.8074914414239033e-06}, "score": 4.802937349233642}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6269361986912769, "3": 0.2659150452425794, "4": 0.05616740907458797, "1": 0.03900678397120776, "5": 0.01188487851417111}, "score": 2.3749313404951833}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6621424929892128, "2": 0.28018488223904287, "4": 0.0532439018606093, "5": 0.002599883610887381, "1": 0.0018179114350637296}, "score": 2.7746205010564333}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.995457636182314, "4": 0.004490803679671638, "3": 4.213136848776263e-05, "2": 1.140981158918788e-06, "1": 0}, "score": 4.995421472694012}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9818787173585413, "4": 0.017099295759099263, "3": 0.000925535563900677, "2": 7.405629579501879e-05, "1": 1.3509411057791448e-05}, "score": 4.980773255740101}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8938683447799866, "4": 0.10085957258986826, "3": 0.005080838357519956, "2": 0.0001567055486262143, "1": 2.4245488478802464e-05}, "score": 4.888410503478329}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8617198165156263, "5": 0.07037791305904467, "3": 0.05473462892125399, "2": 0.01277808097191232, "1": 0.0002870709959925263}, "score": 3.989224804861236}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6681653273731505, "5": 0.3075259208011254, "3": 0.02240357129537421, "2": 0.0015720119236261126, "1": 0}, "score": 4.282072303294783}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.634595875007455, "4": 0.3568509469259482, "3": 0.008158940166482328, "2": 0.00024933828730125233, "1": 0}, "score": 4.626028969621678}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5657509586463606, "5": 0.4270365808435902, "3": 0.006917060381272182, "2": 0.00023966246987916257, "1": 0}, "score": 4.419663586588401}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5318207672875975, "4": 0.4566272529324354, "3": 0.01110700487372106, "2": 0.00037357020718932173, "1": 0}, "score": 4.520003752710968}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7341171193128004, "4": 0.24411191275714303, "3": 0.01679396471955059, "2": 0.00419857540716741, "1": 0.0006761819238539178}, "score": 4.70696974275047}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7200611644176952, "4": 0.27051422345209625, "3": 0.008143121465942153, "2": 0.0011851601095236317, "1": 6.910330493790624e-05}, "score": 4.709359726732374}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9950614721267541, "4": 0.0049118417778787225, "3": 1.6475469174740153e-05, "1": 0, "2": 0}, "score": 4.995055156793826}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9985264572318399, "4": 0.0014640803222839358, "3": 8.529447243720126e-06, "2": 3.2744966118188055e-07, "1": 0}, "score": 4.998517877536748}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9912381507011131, "4": 0.008670411732380718, "3": 7.883235885690408e-05, "2": 5.2358675827978505e-06, "1": 0}, "score": 4.991156150773826}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5869677506093344, "4": 0.3885410818412097, "3": 0.023942424738509598, "2": 0.0005247736138948383, "1": 1.570731547988698e-05}, "score": 4.561933299322966}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8410410746097414, "4": 0.1509846202505364, "3": 0.0072365840516151105, "2": 0.0006743073109511, "1": 3.713754891663913e-05}, "score": 4.832366334737265}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9586946800918101, "4": 0.04085847143934836, "3": 0.00043660812688186087, "2": 4.262639451480238e-06, "1": 0}, "score": 4.958255274850985}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9939282007304608, "4": 0.005993186729842994, "3": 6.985834563597808e-05, "2": 1.6809020065033997e-06, "1": 0}, "score": 4.9938620104570735}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9039284047605837, "4": 0.09377910584203769, "3": 0.002176202268575132, "2": 9.16414846147553e-05, "1": 1.4804505468120328e-05}, "score": 4.90153337812141}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4529247600041929, "3": 0.28323418916400844, "1": 0.10676364639090492, "4": 0.08202185031154526, "5": 0.07503741673874952}, "score": 2.5656367527871646}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5294242942941472, "4": 0.43820968950698774, "3": 0.03171487389812112, "2": 0.0006187355486941124, "1": 2.8136806467890152e-05}, "score": 4.496389658436064}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984986489567917, "4": 0.0014912620561371248, "3": 8.477783686876422e-06, "2": 7.728584622453912e-08, "1": 0}, "score": 4.998491548205109}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960955927961959, "4": 0.0037697032279402315, "3": 0.00012092984184386954, "2": 5.511448961227796e-06, "1": 5.2800974709990914e-06}, "score": 4.995950770274423}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9760666363020774, "1": 0.012172569017143706, "4": 0.007783968351086545, "3": 0.0029960857267546416, "2": 0.0009374023177015566}, "score": 4.934718547987537}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6457133140513746, "5": 0.33640735071746647, "3": 0.016231540258787158, "2": 0.0014739199421810796, "1": 0.00013078549756154344}, "score": 4.316849266968459}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8767556900925159, "4": 0.12151895744728237, "3": 0.001635398456569732, "2": 7.402290393604543e-05, "1": 1.0826572814369343e-05}, "score": 4.874944232285984}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.796675862423742, "4": 0.20131023562773542, "3": 0.0019393205484702636, "2": 5.8605676351849824e-05, "1": 0}, "score": 4.7946320253442485}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7632096689260865, "4": 0.23266637929742284, "3": 0.003661831671725419, "2": 0.00037020598167509486, "1": 4.857507590824926e-05}, "score": 4.758694581163536}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.873516430172431, "4": 0.12533270970884897, "3": 0.0010924597213540438, "2": 4.612206910783715e-05, "1": 8.001088204280585e-06}, "score": 4.87231145413374}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5280535658226162, "4": 0.43582560682260685, "2": 0.02099698128342164, "5": 0.014828266812889929, "1": 0.0002802596676741117}, "score": 3.4439314406776274}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7227890281701401, "4": 0.23208736614323583, "3": 0.0443549306736144, "2": 0.0007156559666379847, "1": 5.271460532086502e-05}, "score": 4.676844847806643}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8069978458876109, "4": 0.18379082292244112, "3": 0.009053190879889707, "2": 0.00015251539746957915, "1": 5.302983347594768e-06}, "score": 4.79762397204122}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.7370724409262288, "4": 0.1953174295644383, "2": 0.0409895140445375, "5": 0.026110240115742495, "1": 0.0005093434574046982}, "score": 3.205529920921185}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6239592732314507, "4": 0.3182256043816528, "3": 0.056959670309548766, "2": 0.0007877380084305297, "1": 6.40498417724545e-05}, "score": 4.565234048525666}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5206576786060666, "2": 0.2563034461335518, "4": 0.19681887291572073, "5": 0.02388499121367058, "1": 0.0023076368193936975}, "score": 2.9836696885396887}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9491954100790632, "4": 0.0397796103789381, "3": 0.007495638207140144, "2": 0.002622008111538276, "1": 0.000882637476987955}, "score": 4.933830904869027}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9463141202904686, "4": 0.05286876331827155, "3": 0.0007678792989450037, "2": 2.0921651045765593e-05, "1": 0}, "score": 4.945531170821768}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9854606452270304, "4": 0.014273602880480645, "3": 0.0002467753868596794, "2": 1.374669673730777e-05, "1": 0}, "score": 4.985191528810113}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9696352307332522, "4": 0.029577489406419685, "3": 0.0007240576801764079, "2": 4.4220812883167937e-05, "1": 0}, "score": 4.96884114073365}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.41758736462312346, "3": 0.21823570165866266, "2": 0.14134311569364466, "5": 0.13833487540163256, "4": 0.0844976040042761}, "score": 2.3846486861468983}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6312720299947117, "3": 0.1328189309187988, "1": 0.10090925816343696, "4": 0.09323578236670492, "2": 0.041621892005656004}, "score": 4.112497527209842}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9712189314723204, "4": 0.028541925571236026, "3": 0.00023159601935488367, "2": 1.5546377463798846e-06, "1": 0}, "score": 4.970990044640478}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9700235504160504, "4": 0.02920369606937099, "3": 0.0007485747445289984, "2": 1.4159270349733305e-05, "1": 8.048345625617586e-06}, "score": 4.969224422584614}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8080274081973684, "4": 0.18370861329992946, "3": 0.008158878158772693, "2": 9.260439085460242e-05, "1": 1.1570034903950684e-05}, "score": 4.79964935156204}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6652204097555711, "3": 0.15721457295619995, "1": 0.15433029508995214, "4": 0.016673560795845768, "5": 0.006554778194132014}, "score": 2.0558960908367268}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5462698743416768, "2": 0.3392093196698694, "3": 0.07026760480200409, "4": 0.022262349291541143, "5": 0.021679633663358903}, "score": 1.633447252135526}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6348025076743629, "4": 0.29911516874648447, "3": 0.05869158021500713, "2": 0.006438656362483575, "1": 0.0009173733735864301}, "score": 4.560500951635201}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.41123997257342626, "3": 0.38853963258567725, "2": 0.1424338923853019, "5": 0.0519636678393089, "1": 0.005799373990078543}, "score": 3.361143140530812}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.8087760042918908, "2": 0.18201304839449872, "3": 0.008816255901968998, "4": 0.0002953545673900433, "5": 9.671935697447393e-05}, "score": 1.2009190272315022}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.44658929940287306, "4": 0.33638265932410905, "3": 0.15569009781703014, "2": 0.053337485623839886, "1": 0.007756853529624056}, "score": 4.160992888309559}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9722843948721431, "4": 0.026330884846996052, "3": 0.00123261136392936, "2": 0.00012406399956276803, "1": 2.3784534486438996e-05}, "score": 4.97073643761453}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5395949572719132, "5": 0.3567797979409208, "3": 0.08799678493507826, "2": 0.014899187466013337, "1": 0.000556065758513159}, "score": 4.237357552699505}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.905973729043769, "4": 0.09014762271569832, "3": 0.003713980746865631, "2": 0.00014219175841146919, "1": 1.145669823865581e-05}, "score": 4.901950933316087}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9806713920094637, "4": 0.018612622488744575, "3": 0.0006771040527756765, "2": 2.6332464194031288e-05, "1": 7.986092233428043e-06}, "score": 4.9799221360310515}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3070750496101133, "3": 0.26286720454675677, "5": 0.21872826908605073, "4": 0.17405805256160548, "1": 0.036821513450088286}, "score": 3.2309003987939486}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7330871420904876, "4": 0.18389101622112777, "3": 0.04201629330891113, "1": 0.02034765311069278, "2": 0.019946216554946647}, "score": 4.590555742290725}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9644825876879386, "4": 0.035130467678418646, "3": 0.0003431553492730885, "2": 5.027674534198248e-06, "1": 0}, "score": 4.964166749644963}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.98564057720162, "4": 0.013581591083245886, "3": 0.0005651343881319931, "1": 9.47467514573548e-05, "2": 9.367061735695317e-05}, "score": 4.98462776804544}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.33681374057986624, "4": 0.2230491339895051, "1": 0.1745727532778578, "2": 0.1369427395517085, "3": 0.1279432337192669}, "score": 3.4108671008235785}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"2": 0.45613283822221445, "3": 0.3583896416303702, "4": 0.17516091732389427, "5": 0.007849860641661393, "1": 0.0024123705119372912}, "score": 2.7298883729408994}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.5958065173148661, "2": 0.37623805911277863, "3": 0.027471966342068433, "4": 0.0004161440847911286, "5": 5.1423772110378195e-05}, "score": 1.4326429935657976}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6951648689771998, "4": 0.2927673244342315, "3": 0.01177142258120935, "2": 0.00027755262586526145, "1": 1.3315137660480526e-05}, "score": 4.682802162234497}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5871730491260759, "3": 0.2850773876381904, "5": 0.09384014776404462, "2": 0.03139290710375519, "1": 0.0025061501703049476}, "score": 3.7384557862807744}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8750806460126743, "4": 0.11863366255719887, "3": 0.005757804731060331, "2": 0.000471945710085235, "1": 5.144856434298346e-05}, "score": 4.86822850461954}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.36092409713506374, "3": 0.3495222000042759, "2": 0.2743514857401798, "5": 0.013401196298535839, "1": 0.0016895805096510755}, "score": 3.110008102309929}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.871251670107176, "5": 0.10061588813894459, "3": 0.025028034559838052, "2": 0.0027787002404963852, "1": 0}, "score": 4.07005326993525}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8741174501783586, "5": 0.07659486048367327, "3": 0.045804886564743436, "2": 0.003375951731135756, "1": 5.6876289979052186e-05}, "score": 4.02386863441581}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.793936512499927, "5": 0.10297505546852768, "3": 0.0928037157112169, "2": 0.01008242973748771, "1": 0.00016552919067485845}, "score": 3.989509507107149}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5875966123091525, "4": 0.4076043685308522, "3": 0.0044957354918738575, "2": 0.0002569690264453581, "1": 0}, "score": 4.582613922319436}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8143664907239844, "1": 0.1286094096434046, "3": 0.05533416219379279, "4": 0.0013869821600345084, "5": 0.0002616703637418614}, "score": 1.9302808496124821}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5451499742851368, "3": 0.253003337156427, "5": 0.1457122051854698, "2": 0.053396055648734224, "1": 0.0026887593498280088}, "score": 3.7778394443284333}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7277739407171524, "3": 0.1806166228276191, "5": 0.07963719670430691, "2": 0.011804233980043604, "1": 0.00014121810764717804}, "score": 3.874985102736692}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8387440035429112, "4": 0.12673531515348474, "3": 0.028799058020404115, "2": 0.0039084187443173945, "1": 0.0018019845385387069}, "score": 4.796731093741402}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.38639554740080884, "3": 0.36113706906986004, "2": 0.17210221593336103, "5": 0.07434269964017994, "1": 0.005873755918083635}, "score": 3.3512834589906393}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3882527476368569, "5": 0.26199836911298846, "3": 0.21584761637743466, "2": 0.12866473644766857, "1": 0.005219686167831565}, "score": 3.7731584003584695}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4297416778511476, "5": 0.21876917509696261, "2": 0.19960463378869953, "3": 0.1437484330335879, "1": 0.008106560555571622}, "score": 3.6514815046668847}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.688176818799253, "5": 0.2956539193738568, "3": 0.01523419510356784, "2": 0.0008657459956399797, "1": 4.022833338618616e-05}, "score": 4.278575651711551}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9944295468329933, "4": 0.005505147584463525, "3": 3.534929886168015e-05, "2": 2.743804766133856e-06, "1": 0}, "score": 4.994415770442786}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8332316868613362, "4": 0.16471741659503475, "3": 0.0019378697039455282, "2": 9.135893219572885e-05, "1": 0}, "score": 4.831129108121624}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6200186628655434, "2": 0.3795552638330237, "3": 0.0004226378044366382, "4": 1.4645800673974928e-06, "5": 9.469268411670598e-07}, "score": 1.3804091104246223}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7798238641429012, "2": 0.21541846364285888, "3": 0.004529136390207752, "5": 0.00013819995116437207, "4": 8.476320607069333e-05}, "score": 1.2252850812848362}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.916401519761583, "4": 0.08218623897481298, "3": 0.0013570251021937736, "2": 3.8130884019782354e-05, "1": 9.495040009166032e-06}, "score": 4.914946692433909}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99053012735119, "4": 0.009222135981215013, "3": 0.00023283279035158445, "2": 6.922746320093948e-06, "1": 0}, "score": 4.990291352713136}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8130627574321816, "4": 0.18060264364201367, "3": 0.0061513666643856725, "2": 0.0001212379396376284, "1": 5.075248376792799e-05}, "score": 4.806525724268763}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9951596792908579, "4": 0.004805484544099699, "3": 3.230395142754161e-05, "2": 9.354800658601723e-07, "1": 0}, "score": 4.995127093332114}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9980979216481499, "4": 0.0018854966839096988, "3": 1.2904648018262869e-05, "2": 4.793583011787864e-07, "1": 0}, "score": 4.998087249828822}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998596400713766, "4": 0.0001381345980447024, "3": 6.914472307730106e-07, "1": 0, "2": 0}, "score": 4.9998604822934904}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995788292173251, "4": 0.00041746952932061453, "3": 3.005447748235369e-06, "2": 1.0609838637200943e-07, "1": 0}, "score": 4.999576201030107}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994198526505887, "4": 0.0005734548222494891, "3": 2.814285914875751e-06, "1": 0, "2": 0}, "score": 4.999420914360088}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7745439302083077, "3": 0.1673663594837731, "1": 0.04125592253093716, "4": 0.015567023193733069, "5": 0.0012390057939927757}, "score": 2.16096596894269}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9424483737710095, "4": 0.05698653882516475, "3": 0.0005474298129590221, "2": 7.378102988669874e-06, "1": 0}, "score": 4.941895869959251}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6049061239595196, "4": 0.3832219322693149, "3": 0.011564425040642526, "2": 0.0002445947007277653, "1": 0}, "score": 4.592889816533902}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8676951289043955, "4": 0.1308041254917008, "3": 0.0014627742135340262, "2": 1.511982895162636e-05, "1": 0}, "score": 4.866221909556125}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9922053108790035, "4": 0.0077439955782381414, "3": 4.9505142742417625e-05, "2": 6.019966237752965e-07, "1": 0}, "score": 4.992155183546179}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5975014311196555, "3": 0.22529980433693425, "5": 0.09641941473282568, "2": 0.07716768481994891, "1": 0.0035577021713553915}, "score": 3.70609527431433}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.626497183667058, "5": 0.24373207750308068, "3": 0.1266248881158822, "2": 0.003076462134005675, "1": 5.910470653033266e-05}, "score": 4.1107780902274556}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9937050765726945, "4": 0.006245113256628678, "3": 3.16631187747738e-05, "1": 0, "2": 0}, "score": 4.993691446024165}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9827954234404048, "4": 0.017154282981818245, "3": 4.775778345634186e-05, "2": 5.573496812576332e-07, "1": 0}, "score": 4.982748495271078}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7680307558166861, "4": 0.22233360496583046, "3": 0.008772833804422488, "2": 0.0006592374959464156, "1": 0.00010075336078765407}, "score": 4.75771509107892}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6925169255443827, "1": 0.21894458887848528, "3": 0.07878915645707214, "4": 0.00697940925321094, "5": 0.0027513570948306393}, "score": 1.8820552679883296}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9413842298135019, "4": 0.05768553096996105, "3": 0.0008043800511802768, "2": 3.598004783335092e-05, "1": 0}, "score": 4.940592429284148}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8945293812593696, "4": 0.10416157288223446, "3": 0.0012717980403242739, "2": 3.243323140981123e-05, "1": 2.1958639275760626e-06}, "score": 4.8931884681773905}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5488497249432391, "5": 0.37124635763408365, "3": 0.07230760273150524, "2": 0.007119370289183008, "1": 0.0004725410199923685}, "score": 4.2832836386703095}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7742660736965881, "4": 0.2183080587862938, "3": 0.0072462969943323735, "2": 0.0001470046998394033, "1": 0}, "score": 4.766750737171328}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7362519466596043, "3": 0.22003399980552266, "4": 0.04048146758864131, "1": 0.0019272277647221115, "5": 0.0012934502740792786}, "score": 2.302953665584526}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7985523604213177, "5": 0.1788576930900625, "3": 0.02137152821588404, "2": 0.001167443457501009, "1": 3.356492281984028e-05}, "score": 4.155053282651686}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9945177412308197, "4": 0.005466146990785632, "3": 1.0889538502680273e-05, "1": 0, "2": 0}, "score": 4.994512045272792}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9871033191868732, "4": 0.012867270013988132, "3": 2.7377802517474985e-05, "2": 3.2354099748987284e-07, "1": 0}, "score": 4.987076981666657}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6429721939019701, "5": 0.3426877144600284, "3": 0.01374224519208064, "2": 0.0005655583979068823, "1": 2.554065657441072e-05}, "score": 4.327739941892089}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9536877187093536, "3": 0.02354951625310763, "1": 0.0226910614673475, "4": 6.694286925589328e-05, "5": 4.454726012745487e-06}, "score": 2.001005705010031}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.44196285009306624, "2": 0.32786868544900005, "4": 0.11463418737915335, "1": 0.06383957392308472, "5": 0.05167529317451588}, "score": 2.7624323292489974}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5760200268810257, "5": 0.3865526723127479, "3": 0.036722585664831435, "2": 0.0006665162750259868, "1": 2.6449137735061255e-05}, "score": 4.348421800546265}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8160717328314684, "4": 0.16539642680192423, "3": 0.01804585970029114, "2": 0.0003176841206988861, "1": 0.00014451098970238367}, "score": 4.79697592843618}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4062608248128544, "3": 0.3776647430725649, "5": 0.15825870683134383, "2": 0.053481659336245914, "1": 0.004328416535674319}, "score": 3.660643478314691}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6252507185529744, "1": 0.37442609448469416, "3": 0.00031721302710167393, "4": 1.206414283489853e-06, "5": 0}, "score": 1.6258917478020463}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7228427189332028, "4": 0.27079315912164753, "3": 0.006260260383042145, "2": 9.920471644452359e-05, "1": 3.5619372135241825e-06}, "score": 4.716374147669738}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5565899255701414, "4": 0.4324362942461922, "3": 0.010906994481446934, "2": 5.876724006926244e-05, "1": 0}, "score": 4.545569771239117}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9665757730266957, "4": 0.032585922794126435, "3": 0.0007668929009879221, "2": 5.207508180037195e-05, "1": 1.3869727091537517e-05}, "score": 4.965668399577491}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.44120445243761686, "3": 0.2759449747469715, "5": 0.19261087828164605, "2": 0.0861065841076538, "1": 0.004119720325850152}, "score": 3.7320899869998807}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6783450752313502, "5": 0.20681096820759232, "3": 0.09787988649916815, "2": 0.01611969117444518, "1": 0.0007946710520047634}, "score": 4.074311380061371}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.372229953916129, "4": 0.364424457015194, "2": 0.19855671535349895, "5": 0.06060964137283914, "1": 0.004053705005014125}, "score": 3.279014638361973}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7218978587301217, "4": 0.2746954086698558, "3": 0.00325259870699394, "2": 0.00012528981303072613, "1": 0}, "score": 4.7184154024284055}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9411243288010424, "4": 0.05870920207229613, "3": 0.00016132799972790664, "2": 3.486239185685702e-06, "1": 0}, "score": 4.940957585502122}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.647986205930971, "5": 0.3181739287396769, "3": 0.0314490343688569, "2": 0.0022525204268478314, "1": 9.220677025499717e-05}, "score": 4.2819562324497875}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5631775142035784, "3": 0.26643349932622035, "4": 0.12742428932166916, "1": 0.028913840166622237, "5": 0.013969791928363883}, "score": 2.5343209283426953}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9903616015020955, "4": 0.009465619924047384, "3": 0.00015405806209752677, "2": 9.300959417071924e-06, "1": 0}, "score": 4.990198268745585}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9584074991460595, "4": 0.04119990205233467, "3": 0.00034624934228584336, "2": 3.538686304914459e-06, "1": 0}, "score": 4.958095189226837}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.990698346526203, "4": 0.009163326602620907, "3": 0.00011227515033525602, "2": 4.469996197546039e-06, "1": 0}, "score": 4.990598510207752}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.904604099600761, "4": 0.08595480019686173, "3": 0.007316930277226339, "2": 0.001729593273735889, "1": 0.0003000501291801799}, "score": 4.893012245730424}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5449870751070586, "3": 0.2237795865897832, "1": 0.13918796404696446, "4": 0.07398747920694758, "5": 0.017752049587651204}, "score": 2.285910174048824}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5460279576832845, "4": 0.4154302453531995, "3": 0.03595768314949754, "2": 0.0023882855823579765, "1": 0.00016207749060997482}, "score": 4.5048245090985235}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.67551040384868, "4": 0.317270898703295, "3": 0.006986575897862168, "2": 0.00016867664820751396, "1": 0}, "score": 4.668228870369567}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9854939888520493, "4": 0.014415483600971734, "3": 8.126606769983221e-05, "2": 1.95309551588982e-06, "1": 0}, "score": 4.985416018391746}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8610246030428526, "4": 0.13181969989333564, "3": 0.006535374021208265, "2": 0.00045284996066695247, "1": 0.0001463171546716304}, "score": 4.85316262708278}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5048100444867225, "5": 0.47093424590909044, "3": 0.02170745997204671, "2": 0.001792245457066542, "1": 0}, "score": 4.445979457354668}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8558270051945763, "4": 0.13916817292565906, "3": 0.004503432028018698, "2": 0.00036547597968138905, "1": 8.581085880324094e-05}, "score": 4.850377795120732}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.972755113874465, "4": 0.026887714681097158, "3": 0.0003221552454112995, "2": 5.4646089185687755e-06, "1": 0}, "score": 4.97245076687768}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9860144305897869, "4": 0.01354854659189832, "3": 0.00022246050004623677, "2": 2.3952712110419836e-05, "1": 0}, "score": 4.985931992774361}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969776663736875, "4": 0.0029912120674266, "3": 2.6080047489267077e-05, "2": 1.5142004713360177e-06, "1": 0}, "score": 4.9969520744852}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.45113772913123645, "2": 0.23051003078197338, "4": 0.2168557918591064, "5": 0.07234308554462769, "1": 0.029107244031316187}, "score": 3.0728208025009858}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7772448313383203, "4": 0.21871282741535067, "3": 0.003883839705007904, "2": 0.00013121137309971353, "1": 1.3739165611212766e-05}, "score": 4.773067827234424}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7638863938665349, "4": 0.19472164534089273, "3": 0.03929711391818008, "2": 0.001956018009697675, "1": 0.00011367773485483024}, "score": 4.72035432844964}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6726007934505239, "5": 0.22661784100827873, "3": 0.0934009184765176, "2": 0.006967491629307459, "1": 0.0004026739824365397}, "score": 4.118075131309743}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5086231550476825, "5": 0.21689521982595997, "3": 0.21642907139948905, "2": 0.0542308957855431, "1": 0.003789955505235956}, "score": 3.8806307060422647}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.766138818856274, "3": 0.15150153834376623, "1": 0.05254601064262437, "4": 0.026790618733597282, "5": 0.0029244185628198426}, "score": 2.1613259267641074}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5416136254106024, "2": 0.23123286560866044, "4": 0.211695999085914, "5": 0.011734966551532498, "1": 0.003707878866359435}, "score": 2.996517257775006}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9417482882861605, "4": 0.056073984971828396, "3": 0.002014510582866868, "2": 0.0001348739391294806, "1": 2.1024229492131964e-05}, "score": 4.939407831714168}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9700913118377593, "4": 0.029355187563373287, "3": 0.0005164190549909116, "2": 1.8373943704263245e-05, "1": 0}, "score": 4.9695562829666455}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.2901678007684709, "5": 0.2255548753447504, "4": 0.21813295865948934, "3": 0.14859410763622047, "1": 0.11739390376273308}, "score": 3.144309664423551}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"2": 0.823123671876201, "3": 0.16939947431266827, "1": 0.005235072424944188, "4": 0.0021105822957858604, "5": 0.00012834982681067528}, "score": 2.168771096833069}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5564706778228531, "3": 0.3763165279792903, "2": 0.037286684499273, "5": 0.029803954289361764, "1": 0.00010441846816794265}, "score": 3.578593327441711}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9054428300367521, "4": 0.09257057985131836, "3": 0.0017748222533974665, "2": 2.0457970416310243e-05, "1": 0}, "score": 4.903799997718965}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9546400638852143, "4": 0.044322696357608285, "3": 0.0009139226665420264, "2": 7.271440863564015e-05, "1": 0}, "score": 4.9536289685848445}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9427669676198103, "4": 0.05610756651826387, "3": 0.0009244745831976362, "2": 2.2554521548203504e-05, "1": 0}, "score": 4.941965465256511}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6776704982196728, "5": 0.13482454668659852, "3": 0.12252077151302088, "2": 0.061192857731985094, "1": 0.0035347252691810063}, "score": 3.8792829078262527}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7115221147969398, "4": 0.28154654463731243, "3": 0.0060107965606975775, "2": 0.0007273336826275172, "1": 0}, "score": 4.704192708171181}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8562082069486124, "4": 0.14130648430568987, "3": 0.0023930848813491345, "2": 5.9193489309641545e-05, "1": 0}, "score": 4.8537249339433925}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8009892121355822, "5": 0.16835694178180582, "3": 0.028145409796045028, "2": 0.0023686751229435375, "1": 8.103041337492202e-05}, "score": 4.135239033189631}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9822537576473571, "4": 0.017624001224552488, "3": 8.344231526447634e-05, "2": 4.564256166090445e-06, "1": 0}, "score": 4.982194811823696}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7420299891405631, "5": 0.1507873368616799, "3": 0.10156320143957101, "2": 0.004902540690398084, "1": 0.0006202497118271804}, "score": 4.037561936474832}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6668421751704819, "2": 0.31801656702375913, "3": 0.013085088232452843, "5": 0.001259465568475786, "4": 0.0006957711911688833}, "score": 1.3513473818158939}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8713308443436656, "4": 0.12617258336255774, "3": 0.0024554687477857376, "2": 2.9200681789708544e-05, "1": 0}, "score": 4.868827315765855}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9587343497810035, "4": 0.04079000512537273, "3": 0.0004633158291658607, "2": 8.636933129721189e-06, "1": 2.714181834732117e-06}, "score": 4.958246554848456}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5789762796717907, "5": 0.3833418228396364, "3": 0.03661445028369285, "2": 0.0010169577566456417, "1": 4.5234974419007153e-05}, "score": 4.344559562598594}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5538775752270197, "2": 0.36732454606743864, "1": 0.07145604311116058, "4": 0.00590704247536384, "5": 0.0014287929243742255}, "score": 2.498524987086667}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5963867159889465, "2": 0.39158126956433376, "4": 0.007702001876125942, "1": 0.0038028469324674656, "5": 0.0005142688370299915}, "score": 2.609538540417137}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6226464794316501, "4": 0.3466389259551234, "3": 0.030603833502834826, "2": 9.688605118971189e-05, "1": 0}, "score": 4.591857085878542}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.48308963153972734, "3": 0.3034975927940107, "5": 0.2091045108683478, "2": 0.004171373170065878, "1": 0.00013291110987371363}, "score": 3.8968650278739743}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.7951659452075739, "2": 0.158126394589643, "4": 0.040271518373487324, "5": 0.003409592828322827, "1": 0.002993996086798751}, "score": 2.882972507680979}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.49791166361041006, "4": 0.3952826382832828, "3": 0.06996716628807921, "2": 0.031041048662741117, "1": 0.005637512820554034}, "score": 4.349005692092644}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7371510686370367, "3": 0.20773750322585083, "5": 0.03197933711188134, "2": 0.022960424936838766, "1": 0.00016656282373187412}, "score": 3.7778201616986404}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7136856569188778, "4": 0.2818252728212579, "3": 0.004371989982307295, "2": 9.443932435476e-05, "1": 0}, "score": 4.709140843912522}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9924364348132555, "4": 0.007457437667308825, "3": 9.755004788683409e-05, "2": 4.323483996792927e-06, "1": 2.2251015565376286e-06}, "score": 4.992325575808169}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.942085873248128, "4": 0.057057713834008435, "3": 0.000797583920001049, "2": 4.5623574061344535e-05, "1": 1.0023111315269774e-05}, "score": 4.941169967942998}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5940733811262563, "3": 0.23196898537053262, "1": 0.15246942421312326, "4": 0.0166498412023094, "5": 0.004821124882673705}, "score": 2.127264812663317}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5729809722851541, "5": 0.3543200777261928, "3": 0.06645880479780833, "2": 0.006118556966795323, "1": 8.457337983740477e-05}, "score": 4.275380632026476}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5439591102134682, "5": 0.41346093623366786, "3": 0.0413105980728891, "2": 0.001148583310428096, "1": 0}, "score": 4.369897844905163}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8550486851248507, "4": 0.13527079780872026, "3": 0.008795355332148858, "2": 0.0007635064388559658, "1": 9.04109653321616e-05}, "score": 4.8444814692767775}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9013198949928158, "4": 0.09323831841447539, "3": 0.0052855388842745245, "2": 0.00010532065544380454, "1": 0}, "score": 4.895869338782942}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6963182760493658, "3": 0.2769197294970089, "1": 0.020279470704162934, "4": 0.006353687029586633, "5": 0.00012852424427814}, "score": 2.2697332898699245}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4280951906793668, "4": 0.2533189277832946, "5": 0.1657324728503695, "2": 0.1459590902945663, "1": 0.006891158953822551}, "score": 3.425043808181628}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9953649143188793, "4": 0.004589163571255278, "3": 4.0773711915962905e-05, "2": 3.0191932228883805e-07, "1": 0}, "score": 4.995328360605947}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7775449446310996, "4": 0.20100610464823676, "3": 0.020803635997080027, "2": 0.0004189864405590614, "1": 0.00022268173571919655}, "score": 4.755238044557}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5367148130167304, "3": 0.3774798459236442, "5": 0.06281234803970792, "2": 0.02217945874939302, "1": 0.0008134020859597763}, "score": 3.638533330579084}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5077949117230227, "4": 0.46104216774773815, "3": 0.029806818586996266, "2": 0.001233937997375414, "1": 9.407558528800073e-05}, "score": 4.475251339415924}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9106632816881359, "4": 0.08775097549024528, "3": 0.0015300803937860936, "2": 3.4464836003053006e-05, "1": 0}, "score": 4.909083542004207}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5211236673710443, "5": 0.4604807345965635, "3": 0.01827997098886114, "2": 8.555423975996576e-05, "1": 0}, "score": 4.442042948599034}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7309129571415222, "4": 0.2682004849421271, "3": 0.0008597754564153332, "2": 1.3649399909140814e-05, "1": 0}, "score": 4.730035470484944}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7101857382428303, "4": 0.2815859075956594, "3": 0.008105106369052388, "2": 0.0001094509559399713, "1": 7.842687413533065e-06}, "score": 4.70184238077384}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7626764099103946, "3": 0.21996019078074414, "1": 0.010324041266408924, "4": 0.00625793199928588, "5": 0.0007635953161780088}, "score": 2.2244468015110823}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8636981453754377, "1": 0.08708702264214134, "3": 0.04175485278786882, "4": 0.006011239572728892, "5": 0.0013928378422080128}, "score": 1.9708671942421225}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6868152264965001, "4": 0.2906655748495122, "3": 0.01936548347292381, "2": 0.0026972846424413756, "1": 0.00025421148989857294}, "score": 4.66142629226462}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.974922027477651, "4": 0.024486055175110665, "3": 0.0005028861778760108, "2": 5.498814177877301e-05, "1": 2.0806731371126015e-05}, "score": 4.974259640411293}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6286124555926969, "3": 0.3054627008403369, "4": 0.034838238081157706, "1": 0.024352063249601433, "5": 0.0066983811579233304}, "score": 2.3708956692141503}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9370118032232018, "1": 0.04984760638879632, "3": 0.012894608509214573, "4": 0.000220512538665051, "5": 2.4058119722346094e-05}, "score": 1.9635601501322562}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6111258788493054, "5": 0.34948850768819123, "3": 0.03792256353914307, "2": 0.0014190205484099832, "1": 3.3169857535332166e-05}, "score": 4.308631745071432}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.981515104680432, "4": 0.018353121682735167, "3": 0.00011051017055724122, "2": 2.3854542274418843e-06, "1": 0}, "score": 4.981418350828871}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986273780085025, "4": 0.001364920628028966, "3": 5.54770072405107e-06, "1": 0, "2": 0}, "score": 4.998623981007043}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9654941009226712, "4": 0.03420927749217737, "3": 0.000261319698957371, "2": 1.8321212800661552e-05, "1": 0}, "score": 4.965212528756819}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.82381087174399, "3": 0.16671196769344288, "4": 0.0062930652866728404, "1": 0.0030349953093221256, "5": 0.00014520514824054997}, "score": 2.176699406614276}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9209770846324936, "4": 0.07746632911976432, "3": 0.0015054321185993577, "2": 4.035654381763862e-05, "1": 7.41994435603323e-06}, "score": 4.9193717849009975}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6070888518314121, "4": 0.382926313983169, "3": 0.009790578825795466, "2": 0.0001698148214848077, "1": 0}, "score": 4.596973233709733}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9958593200532486, "4": 0.00409896121323179, "3": 3.6810074009279175e-05, "2": 1.0060618571061097e-06, "1": 0}, "score": 4.99582438415743}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.894958366201412, "4": 0.10324998421730894, "3": 0.001688752818002361, "2": 6.415195448157696e-05, "1": 0}, "score": 4.89317591540451}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6676690916260071, "3": 0.213922709448408, "2": 0.08736256553752784, "5": 0.029919513082167837, "1": 0.0010747634372403273}, "score": 3.6380287925392265}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9564876001117755, "4": 0.04294236977505192, "3": 0.0005518017636555429, "2": 9.935265088814034e-06, "1": 0}, "score": 4.955923855375181}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5451428274158218, "3": 0.3150101873140275, "5": 0.0932438942326319, "2": 0.04563305202093875, "1": 0.0007616232858853644}, "score": 3.6846170022411444}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7728525027889797, "4": 0.21155791250215766, "3": 0.01417952863454688, "2": 0.001319963360455208, "1": 6.85915643124524e-05}, "score": 4.755843524245235}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7395468834428486, "5": 0.2192614775401774, "3": 0.03907087400236086, "2": 0.0020598040954479158, "1": 5.040818476201697e-05}, "score": 4.175921627246843}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6228980233682931, "4": 0.23230360978554776, "3": 0.08922325206420903, "2": 0.04280970284934163, "1": 0.012748910015659169}, "score": 4.409815398298091}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6142261107960937, "4": 0.33684365096803126, "3": 0.04386660300560897, "2": 0.004878397959513443, "1": 0.00017415131677964502}, "score": 4.560086467013914}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7536496681872706, "4": 0.24202532730902315, "3": 0.00423716019271811, "2": 6.83722170042013e-05, "1": 0}, "score": 4.749290353812735}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995552481314467, "4": 0.00044083187104747735, "3": 3.3798051434433323e-06, "2": 1.755010168570519e-07, "1": 0}, "score": 4.99955188185219}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.872054418921784, "4": 0.1262867328345974, "3": 0.0015295908463918422, "2": 6.264040755481314e-05, "1": 0}, "score": 4.870457534520869}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7833642838458642, "3": 0.19267672393222335, "1": 0.01292598050943486, "4": 0.01063643401723121, "5": 0.0003899907254581071}, "score": 2.202194915485425}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9887776081643298, "4": 0.011038280522908351, "3": 0.00017664596962768686, "2": 4.3422973786015886e-06, "1": 2.1176427463760213e-06}, "score": 4.988586918599969}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.897636797160452, "4": 0.10031463323398052, "3": 0.001973571368697358, "2": 3.385577390119306e-05, "1": 0}, "score": 4.895632362765271}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9480163879589519, "4": 0.051459427362920744, "3": 0.0005021175511738948, "2": 9.391805539512356e-06, "1": 0}, "score": 4.947507496758762}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9613887704543002, "4": 0.038340193286407455, "3": 0.0002684483573851651, "2": 1.8138969791016879e-06, "1": 5.08975986147994e-07}, "score": 4.961115422098402}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9157577631416378, "3": 0.0810248970946308, "1": 0.003016295066203421, "4": 0.0001918996459353505, "5": 8.993270342923219e-06}, "score": 2.0784193930339208}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9709717284753618, "4": 0.027159287773419635, "3": 0.0013914475094332318, "1": 0.00019345183329908094, "2": 0.00016558117500184248}, "score": 4.9687835671012754}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9299098955816285, "4": 0.06877705448928072, "3": 0.0012558476701739368, "2": 3.913654002023722e-05, "1": 0}, "score": 4.928592550523401}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5921096332163965, "4": 0.36525464905991, "3": 0.0406394178651014, "2": 0.0018998354534640696, "1": 8.911810905276733e-05}, "score": 4.547407211532658}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9923811377956969, "4": 0.007444245210903303, "3": 0.000169120344302008, "2": 3.3620404214945242e-06, "1": 1.199328189528479e-06}, "score": 4.992202623373735}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7929714266211907, "3": 0.15956005615634308, "1": 0.041631899111300066, "4": 0.004826141460720112, "5": 0.0006354231519380573}, "score": 2.129535292086775}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9499794767898615, "4": 0.048826455115044645, "3": 0.0011221737797076391, "2": 2.736437699821794e-05, "1": 0}, "score": 4.948844826257811}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8500707735193517, "4": 0.14622211174159191, "3": 0.003606659432537016, "2": 3.238818053576265e-05, "1": 0}, "score": 4.846456953617844}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8715464992706771, "4": 0.12375455130344286, "3": 0.004548403439563721, "2": 0.00013481474246482134, "1": 1.3774823721423887e-05}, "score": 4.866688837482508}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9909189490799164, "4": 0.008967512093200555, "3": 0.00010224067144654024, "2": 2.9514204353195634e-06, "1": 0}, "score": 4.990819075671858}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5143765470112706, "3": 0.36476983986808453, "2": 0.0683477592374934, "5": 0.050905311968327635, "1": 0.0015590073100223674}, "score": 3.5447440228180938}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.632546906914891, "5": 0.33163938173543955, "3": 0.0307792105207127, "2": 0.0045817924169670315, "1": 0.0004397272102594719}, "score": 4.290381174246616}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9989314398174595, "4": 0.0010633170121994728, "3": 4.3703432719857425e-06, "2": 2.3247689341944575e-07, "1": 0}, "score": 4.998927244183638}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963668663590874, "4": 0.003616977307057229, "3": 1.5021095172581776e-05, "2": 3.8492551073054173e-07, "1": 0}, "score": 4.996351822988791}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4987334970235962, "4": 0.4681817517574627, "3": 0.03147067245518066, "2": 0.0014765002314861269, "1": 0.00012151996350472488}, "score": 4.463952714631503}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.35804668358768493, "2": 0.34061989528370246, "4": 0.26446520141167623, "5": 0.0231749181351574, "1": 0.013677206374941396}, "score": 2.942839809643319}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7853478958091417, "3": 0.1817488481754762, "1": 0.018678775494805244, "4": 0.013018758500660583, "5": 0.0011997740878936043}, "score": 2.192708058160103}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9129302571214043, "4": 0.08506164925765342, "3": 0.0019013572608859546, "2": 7.605399571560992e-05, "1": 0}, "score": 4.910904740580218}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.996732213773598, "4": 0.0032214964221576226, "3": 4.218942334376541e-05, "2": 2.0274575262598946e-06, "1": 0}, "score": 4.9966880354931265}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999803763825457, "4": 1.9374767166693227e-05, "3": 6.534264180014418e-08, "1": 2.1489186109427496e-08, "2": 0}, "score": 4.999980408587631}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9630614868010617, "1": 0.030645198029991758, "3": 0.0062644110590060875, "4": 2.616512868345223e-05, "5": 1.3593226958849327e-06}, "score": 1.9756755876950853}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5826800922973293, "4": 0.38626462013667273, "3": 0.028934778473224558, "2": 0.001823285838336421, "1": 0.00019055837116816536}, "score": 4.549585688527239}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8001687948561781, "5": 0.10768900383348416, "3": 0.0899034286270394, "2": 0.0021085621695702177, "1": 0}, "score": 4.013570217852343}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.953760367684585, "4": 0.04561767627336668, "3": 0.0005741662324501717, "2": 2.5464607781610114e-05, "1": 0}, "score": 4.95315655164895}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6711223626446018, "4": 0.30497923093146145, "3": 0.022413883791607723, "2": 0.0012064380754420877, "1": 0.00021994588921020662}, "score": 4.645673303620105}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"5": 0.47522583301784227, "4": 0.1916672084809043, "3": 0.16793764990215873, "2": 0.1473816055138921, "1": 0.017724856544426466}, "score": 3.959347847607467}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8555674037786704, "4": 0.14135514450460884, "3": 0.0029154910998727517, "2": 0.00013283895873185996, "1": 2.2474460103192927e-05}, "score": 4.852324476950593}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9966374809719647, "4": 0.0033375622624968898, "3": 2.2958943554641923e-05, "2": 4.211696985663979e-07, "1": 0}, "score": 4.996615251004725}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9723664396908046, "4": 0.027004563736055264, "3": 0.0005972253769402638, "2": 2.4091656035738646e-05, "1": 3.8325621874177225e-06}, "score": 4.971713271474786}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6565466691183144, "4": 0.2965701188412448, "3": 0.04316622578662805, "2": 0.0031556745574320534, "1": 0.0005559397682875114}, "score": 4.6054045271015465}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8336901153492137, "5": 0.11042802806060427, "3": 0.050244434218419155, "2": 0.005549069627282161, "1": 5.725406005804706e-05}, "score": 4.0489152136062385}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8743716630087337, "4": 0.1248534037391025, "3": 0.0007091869393258502, "2": 4.115447040192252e-05, "1": 0}, "score": 4.873601650602748}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5883859905127382, "4": 0.3960511933289033, "3": 0.014921050169318543, "2": 0.0005986592419111584, "1": 0}, "score": 4.572292291518692}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8540567119182685, "4": 0.14230261462804517, "3": 0.003279328510346246, "2": 0.00030641627643027624, "1": 3.6869054138763556e-05}, "score": 4.8500692956149525}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969500605440064, "4": 0.0030296799260730914, "3": 1.8154174930242305e-05, "2": 6.370224109296175e-07, "1": 0}, "score": 4.996932096152131}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7780908561020625, "1": 0.16975166568740285, "3": 0.04190987498454899, "4": 0.008662952319621432, "5": 0.0015687408308151045}, "score": 1.8941886529623086}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8665751199906642, "4": 0.130627789691651, "3": 0.002556492697225579, "2": 0.0001886970007486254, "1": 0}, "score": 4.863686059133645}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7005119879027307, "4": 0.289555960537958, "3": 0.0096531914316576, "2": 0.00022830924734831026, "1": 0}, "score": 4.690437080178576}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9823997264893262, "4": 0.017364506715737065, "3": 0.0002178192429279868, "2": 1.0343968104270527e-05, "1": 4.652159674768416e-06}, "score": 4.982150161572949}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.975369561855946, "4": 0.024455280867063296, "3": 0.00016886178802121878, "2": 5.285459490696815e-06, "1": 5.240865471222392e-07}, "score": 4.975189030775518}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3646309254940009, "4": 0.2784594309678492, "2": 0.22075102417157427, "5": 0.12721936488518404, "1": 0.008853853420340894}, "score": 3.2944645773133057}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9414717035343905, "4": 0.05786842383921379, "3": 0.0006398046260579027, "2": 1.7734547226595374e-05, "1": 1.4062626155164508e-06}, "score": 4.940793083320439}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9722285066545993, "4": 0.025973382898707348, "3": 0.0017715340727541414, "2": 2.2013580491191944e-05, "1": 0}, "score": 4.970417373234896}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8154374999642595, "4": 0.17490094393042804, "3": 0.008886482296014443, "2": 0.0005877422832129506, "1": 0.0001666942936578643}, "score": 4.804892060965386}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.56698620803698, "5": 0.26811156440516015, "3": 0.1212796067002795, "2": 0.04160931577025678, "1": 0.0019855784434782762}, "score": 4.057658189502018}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.445026209854905, "2": 0.442566359856719, "4": 0.09499148718268526, "5": 0.011836155578663738, "1": 0.005576094265998152}, "score": 2.664944012502077}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.978131333627952, "4": 0.02127576175485748, "3": 0.0005606993579061544, "2": 2.5151324469549838e-05, "1": 6.412470165704012e-06}, "score": 4.977501721243407}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8527930970985086, "4": 0.14346020490174727, "3": 0.0035760283280072327, "2": 0.00014853484214546472, "1": 1.8847712579523133e-05}, "score": 4.84886624627115}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9889851120615304, "4": 0.010713557322986803, "3": 0.00028688761622216313, "2": 1.0781989012444577e-05, "1": 3.323124842775679e-06}, "score": 4.988667025148913}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.762342270697727, "4": 0.22803209326482574, "3": 0.008714505002146553, "2": 0.0007391867223403719, "1": 0.00016409959957486482}, "score": 4.751662990032894}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8475227130734339, "4": 0.14112881840195599, "3": 0.009783333542463255, "2": 0.0011770080633062244, "1": 0.00038430109925078503}, "score": 4.834235651741705}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6195343075669982, "5": 0.3464458325464007, "3": 0.03113976995647523, "2": 0.002775136344049261, "1": 8.105067351067717e-05}, "score": 4.3095200363116595}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9713076534602356, "4": 0.028250692737752072, "3": 0.0004127204791797046, "2": 1.6705175105326283e-05, "1": 0}, "score": 4.970873394614138}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6529119225783543, "4": 0.33692015684808, "3": 0.00972727386846283, "2": 0.00040669892023371365, "1": 2.8653269575670948e-05}, "score": 4.642288691667997}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9753661597728475, "4": 0.024096448849159124, "3": 0.0005086949670160544, "2": 2.1809432462127917e-05, "1": 5.418773823140017e-06}, "score": 4.974799020823934}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8005350999290665, "3": 0.15499024492673333, "1": 0.03740205610512196, "4": 0.005837772360678402, "5": 0.0008228493696336855}, "score": 2.1317865747302576}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.995880006955007, "4": 0.004061682428291563, "3": 3.459798896460597e-05, "2": 1.210738565323061e-06, "1": 0}, "score": 4.99586539634169}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5491662005746079, "5": 0.41152697835727825, "3": 0.03808577980435231, "2": 0.001140910101986273, "1": 0}, "score": 4.37118912216455}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9076098076479774, "4": 0.08950989510322886, "3": 0.002803357704681248, "2": 6.630581216395958e-05, "1": 7.448774766279974e-06}, "score": 4.9046543732801124}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9867930532750713, "4": 0.012980272163679698, "3": 0.0001969942534413943, "2": 5.852298897400027e-06, "1": 0}, "score": 4.986607863324793}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7343427334828087, "1": 0.16533957328406945, "3": 0.08234792664732263, "4": 0.011589392950595488, "5": 0.006347738952234159}, "score": 1.9592290255733218}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4284425038473971, "2": 0.3098246148974306, "4": 0.23441721057966675, "5": 0.01894742955859505, "1": 0.008358958842601443}, "score": 2.9457690337275184}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.5694943939236385, "3": 0.40065955592017327, "4": 0.025423338201243654, "1": 0.0038495751015757145, "5": 0.0005703969705361776}, "score": 2.4493690793513196}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.933611671949302, "4": 0.06485044540557608, "3": 0.0014928016836870685, "2": 3.76289634341735e-05, "1": 5.833683143755216e-06}, "score": 4.932027619603459}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4617365909298135, "3": 0.3599872013390267, "1": 0.13833682593712698, "4": 0.029280585309800815, "5": 0.010644382401794114}, "score": 2.312149192571078}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5576996629187648, "4": 0.38186344809559475, "3": 0.05678784344596761, "2": 0.003367911700961219, "1": 0}, "score": 4.494314964734443}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5451879943700885, "4": 0.3975313261771925, "3": 0.05621774076057665, "2": 0.0009806548452631456, "1": 0}, "score": 4.487049020185986}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6261418913925311, "3": 0.2694528655089158, "5": 0.0955201747385108, "2": 0.008747649003756006, "1": 8.541208129676945e-05}, "score": 3.8083058054855043}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983631713675842, "4": 0.0016289738537209034, "3": 6.398557395242381e-06, "2": 1.0808358218662839e-07, "1": 0}, "score": 4.998357902566968}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8979416863840276, "4": 0.09866527679130645, "3": 0.003239971971457628, "2": 0.00012982748853981538, "1": 0}, "score": 4.894462844394788}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3557177854544956, "3": 0.31663490122762494, "2": 0.2989434063284455, "5": 0.024374757764847915, "1": 0.004323707617568857}, "score": 3.0968770065872073}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7457701396886542, "3": 0.20062983213094845, "5": 0.03325645817212568, "2": 0.020277412442345006, "1": 5.546596325646491e-05}, "score": 3.7919031783781842}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5415742786100062, "5": 0.44971276500807006, "3": 0.00860721047225384, "2": 9.501478945563515e-05, "1": 0}, "score": 4.440920256525183}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7390520851024844, "5": 0.24578900852454086, "3": 0.014568013643766297, "2": 0.0005472772655286223, "1": 0}, "score": 4.230136477858909}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9952703133610256, "4": 0.004700800338385763, "3": 2.776939619361177e-05, "2": 7.593257260719869e-07, "1": 1.7995770246056644e-07}, "score": 4.995240662215881}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3892993243181639, "4": 0.30657504762153925, "3": 0.15832112054350214, "2": 0.12158410906754852, "1": 0.024148121176126112}, "score": 3.915359504526978}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9525390704284598, "4": 0.043113013072808515, "3": 0.003516344230293423, "2": 0.0006017477021023202, "1": 0.00020128293557994528}, "score": 4.947242417830548}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9949525329891822, "4": 0.004999019928806692, "3": 4.046063628805354e-05, "1": 1.486656379861533e-06, "2": 0}, "score": 4.994914079115683}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998014858765367, "4": 0.00019737422735506104, "3": 1.0412933621611732e-06, "1": 3.085891961066403e-08, "2": 0}, "score": 4.999800419736722}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992515241978611, "4": 0.000739126111514218, "3": 3.950880865456032e-06, "1": 2.2180416145732446e-07, "2": 0}, "score": 4.9992520810381285}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7518983327374019, "3": 0.17485320248973818, "1": 0.043572245605683374, "4": 0.02600279621532818, "5": 0.0036575637327487774}, "score": 2.194262321361675}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.741837197697398, "4": 0.24260739516046345, "3": 0.01277787652425236, "2": 0.002495470476050428, "1": 0.0002601878988701055}, "score": 4.723303636797316}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9972820400595924, "4": 0.0026902961459413367, "3": 2.4824090131594515e-05, "2": 6.083350729245605e-07, "1": 0}, "score": 4.997258224550664}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8617679793820702, "4": 0.13009188116296133, "3": 0.007058332113033214, "2": 0.0009072135400526839, "1": 0.000160525299264494}, "score": 4.852425636643439}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9830361247685435, "4": 0.016866649654227052, "3": 9.33784469561129e-05, "2": 2.313493125674827e-06, "1": 0}, "score": 4.982939626808062}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5885832682131922, "5": 0.3697965091152428, "3": 0.035862948200657996, "2": 0.005198842366529093, "1": 0.00048625445554453735}, "score": 4.322100361261657}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7363790715319338, "5": 0.15106772995259746, "3": 0.10479655288026965, "2": 0.007528754167964908, "1": 0.000158160692600275}, "score": 4.03074133027537}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6380993415499499, "5": 0.32788763680670796, "3": 0.03183339445859875, "2": 0.0019115105225073138, "1": 0.00013522019962566886}, "score": 4.291864348443689}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8292600515286812, "4": 0.16833626881870092, "3": 0.002290818732966618, "2": 9.022292551970988e-05, "1": 1.4201286483942797e-05}, "score": 4.826753158159915}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9669594869610735, "4": 0.03269157760012812, "3": 0.00031947644865293047, "2": 1.3137234911062351e-05, "1": 0}, "score": 4.966629513132915}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.830024367656633, "3": 0.09705757692783791, "1": 0.05123567562658955, "4": 0.019924714164094495, "5": 0.001704435513825357}, "score": 2.090789468904423}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9284323075655198, "3": 0.05994634900681982, "1": 0.006689497632255907, "4": 0.0045160615656690125, "5": 0.00040977788047794007}, "score": 2.06351868966277}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9655169949902233, "4": 0.034025535232587466, "3": 0.0003655414057372094, "2": 5.717019241638889e-06, "1": 0}, "score": 4.965223232746083}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9299096854220158, "4": 0.0671373203235436, "3": 0.0024504588162988297, "2": 0.00017155408099313178, "1": 0}, "score": 4.927423078192803}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6810611720963018, "5": 0.19744620726863651, "3": 0.10850345100605716, "2": 0.011831110900890018, "1": 0.0011055201840348733}, "score": 4.061967229576718}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6590314643631949, "3": 0.20004436740725945, "1": 0.06898476471478907, "4": 0.0524070214235109, "5": 0.019399569575284336}, "score": 2.2941114159424694}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.421836196606432, "4": 0.34877659175273085, "3": 0.176080746891377, "2": 0.0473166138958972, "1": 0.005674916099233469}, "score": 4.134139718884974}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9771555477907867, "4": 0.02256831607342749, "3": 0.00021535644906761866, "2": 7.983281623658221e-06, "1": 0}, "score": 4.9769758055888715}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8903793509915584, "4": 0.10759210581257601, "3": 0.00193359096735372, "2": 6.826837017793678e-05, "1": 0}, "score": 4.888332927433837}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7275485112711424, "5": 0.131151517764355, "3": 0.12589523325585805, "2": 0.014055394594374302, "1": 0.0010573784442355928}, "score": 3.973965758908432}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9388042574726, "1": 0.032158753331195215, "3": 0.02707000474688537, "4": 0.0013719578112074873, "5": 0.0005893619776536731}, "score": 1.9994232497039717}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6740911566228494, "2": 0.23883512945799293, "5": 0.06098249031684399, "3": 0.017921309487964023, "4": 0.007654473735864481}, "score": 1.541850422495744}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.4393885225963981, "4": 0.4313307162648343, "3": 0.11435232801969868, "2": 0.01381104561623865, "1": 0.0009800744694029545}, "score": 4.294514320590761}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9681600794938062, "4": 0.030896465090133104, "3": 0.0006823921946079554, "2": 0.00011169149457985461, "1": 0}, "score": 4.9673988063403165}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5341685249585034, "1": 0.26393624532011456, "3": 0.10094593525167685, "5": 0.07626458523623166, "4": 0.024577725836881892}, "score": 2.114971197323221}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7482370570700023, "2": 0.20731593359504213, "3": 0.030098760123079094, "4": 0.008841588711363342, "5": 0.00538448504831606}, "score": 1.3156147205397568}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7229604796034633, "1": 0.15483765469850513, "3": 0.10560600962516883, "4": 0.013998417380596042, "5": 0.002585369865049063}, "score": 1.986521136608929}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9940180691216396, "4": 0.005880701038168048, "3": 9.61806850074368e-05, "2": 1.3553077603676112e-06, "1": 0}, "score": 4.993922849220469}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972576168217682, "4": 0.0027079448221703044, "3": 2.7195120340571133e-05, "1": 1.2371490236290556e-06, "2": 0}, "score": 4.997232699720408}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9767792658677958, "4": 0.023085893938298102, "3": 0.00011976129555307089, "2": 8.248584071866006e-06, "1": 0}, "score": 4.976649678228345}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6296817789416692, "5": 0.30408971681913805, "3": 0.06444074239646798, "2": 0.001700936325223691, "1": 0}, "score": 4.2362676158302355}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8689676335826195, "4": 0.12164046420016618, "3": 0.008346193602844908, "2": 0.000764861642478515, "1": 0.0002272999607011466}, "score": 4.858455784554216}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8389830041421742, "4": 0.15763393517861463, "3": 0.003318370267033817, "2": 3.1073723482854496e-05, "1": 0}, "score": 4.835630577561164}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9498196324426856, "4": 0.04926215695985515, "3": 0.0008910182037556326, "2": 1.7945287721036156e-05, "1": 0}, "score": 4.94890149825621}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6854457653716817, "4": 0.2928863878322949, "3": 0.01979549682953873, "2": 0.001652820593353354, "1": 0.0001964870563140258}, "score": 4.661770414910054}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7015292247056326, "4": 0.2717890405016124, "3": 0.022743706709673975, "2": 0.0031043988171750568, "1": 0.0006650442354812956}, "score": 4.670694656734277}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5493700339705886, "4": 0.27924107560102496, "3": 0.11492908419560567, "2": 0.04950369330344676, "1": 0.006896267194976943}, "score": 4.314763598841881}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9431819470974351, "4": 0.055981936655711564, "3": 0.0007831585437742289, "2": 3.3340389434866254e-05, "1": 0}, "score": 4.942350594161959}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987063137344926, "4": 0.00127811582147621, "3": 1.3576095440054638e-05, "1": 1.1589559514271865e-06, "2": 4.997529303256503e-07}, "score": 4.998688596464888}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975901544511756, "4": 0.0023817701672614695, "3": 2.417290935481166e-05, "1": 1.1160610401790036e-06, "2": 0}, "score": 4.997565412986108}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.4848936793070613, "4": 0.24486985834441183, "3": 0.2044189325381474, "2": 0.04992475035966103, "1": 0.015836540804489086}, "score": 4.133123110299629}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6124524329921263, "5": 0.1767796919344839, "3": 0.14474285857724875, "2": 0.06179648457723202, "1": 0.004186016974089981}, "score": 3.895881386683402}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5292941036934029, "3": 0.38518975345349027, "2": 0.05488962106382043, "5": 0.03012439410712909, "1": 0.00048511528220684073}, "score": 3.5336921196632165}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9160436615466746, "4": 0.08192538377014429, "3": 0.0019180542850032655, "2": 6.971228502431208e-05, "1": 0}, "score": 4.914025657735156}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7370056651880674, "5": 0.20973234684781505, "3": 0.05069370184834234, "2": 0.002459994905438424, "1": 0.00010546957871946286}, "score": 4.153802680426944}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6850237704055623, "5": 0.2354472928803493, "3": 0.07241006282159698, "2": 0.006683509868547568, "1": 0}, "score": 4.14973539972781}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7329906301908777, "5": 0.23320345710037735, "3": 0.03224413863533591, "2": 0.0015224775560493192, "1": 3.289216744884943e-05}, "score": 4.197816953739586}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8904306694843093, "4": 0.10835496806971959, "3": 0.0012093478882281238, "2": 2.417842365494393e-06, "1": 0}, "score": 4.8892187949594685}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943027210012345, "4": 0.005657382214659231, "3": 3.5710242698765926e-05, "2": 1.2741554385190425e-06, "1": 0}, "score": 4.994267358137962}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8961018827904862, "4": 0.10167589750838743, "3": 0.002139942113672444, "2": 6.800971468346367e-05, "1": 1.1949656795990211e-05}, "score": 4.893792144280286}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"2": 0.878520988806079, "3": 0.11168503017691324, "1": 0.00515284340083413, "4": 0.00444645335256713, "5": 0.0001933524246069879}, "score": 2.1160053052554244}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5701056981463932, "3": 0.30789172500671264, "4": 0.0835365097644527, "1": 0.022104678412254667, "5": 0.016224683881539505}, "score": 2.5016026892576018}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.662190367622103, "3": 0.2439060911761875, "5": 0.07100862006103383, "2": 0.022588485357445356, "1": 0.00025197290401095414}, "score": 3.7811577206772964}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.536385961294737, "5": 0.3989154656810334, "3": 0.0500809090699407, "2": 0.010796456505840924, "1": 0.003775109085037406}, "score": 4.315930880240829}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7433681096558886, "4": 0.2101923531764525, "3": 0.03871303166884689, "2": 0.005483306412639199, "1": 0.0021422780645479595}, "score": 4.687330997114543}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9518227057407268, "3": 0.02882930426357157, "1": 0.01864828116265298, "4": 0.0006417780696120611, "5": 5.6992037093655546e-05}, "score": 2.011635566274036}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8689236214865943, "3": 0.09273557640924902, "5": 0.02866257253909274, "2": 0.009594828726196797, "1": 4.3677869626679893e-05}, "score": 3.916602992291798}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.869416597376046, "3": 0.09028280116397705, "5": 0.03285123301673226, "2": 0.007250634476098898, "1": 0}, "score": 3.9280528645609074}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7325610183929175, "5": 0.22658346568923163, "3": 0.039529533614906444, "2": 0.0012528445161921933, "1": 6.388998104703572e-05}, "score": 4.184358278008334}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7274383396669999, "3": 0.1491547084447065, "5": 0.07436780197261375, "2": 0.04743000185416426, "1": 0.001426550480891928}, "score": 3.8260416740074477}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9807366264787265, "2": 0.019104258703762894, "3": 0.00011473321433828571, "5": 2.058043054947238e-06, "4": 0}, "score": 1.0193427759598004}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5627298309485922, "3": 0.2745415124885748, "5": 0.11768849711918994, "2": 0.04300736065132739, "1": 0.0020003974363280615}, "score": 3.751123007066931}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7864717152031256, "4": 0.20352722485019498, "3": 0.009597304511370714, "2": 0.00031643174349545324, "1": 0}, "score": 4.776309337402095}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5419792567249806, "4": 0.4095266493617542, "3": 0.04422195914650471, "2": 0.003896421933160235, "1": 0.0003460500985122829}, "score": 4.488940806738242}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.33172346297555644, "2": 0.32733701889690064, "3": 0.2290268576478288, "4": 0.07451527060777798, "5": 0.03707048049776278}, "score": 2.1575968972841797}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3771227302811158, "1": 0.24153352394892355, "3": 0.1410167219846584, "4": 0.124551997458487, "5": 0.11563116102830451}, "score": 2.495551968769537}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7992268149267564, "4": 0.1975589417351013, "3": 0.0030130946664339068, "2": 0.00010531833841487205, "1": 0}, "score": 4.796079372135052}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8051377324400815, "4": 0.1935524971901731, "3": 0.0012736028565277278, "2": 2.863632617822072e-05, "1": 0}, "score": 4.803812910596571}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9985801786014882, "4": 0.001404251722386326, "3": 1.1658838454168153e-05, "2": 5.542632957578789e-07, "1": 0}, "score": 4.998570763013478}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9822324744035199, "4": 0.017486106983582307, "3": 0.00020145107702043664, "2": 1.0631502822659957e-05, "1": 0}, "score": 4.98207785370338}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5253281048387849, "4": 0.3266025796425768, "2": 0.13535925323775483, "5": 0.012089192588519267, "1": 0.0005349442618252239}, "score": 3.2143702429136276}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7144828819369891, "2": 0.25225018155660395, "4": 0.031189268552000902, "5": 0.001627517225358378, "1": 0.00044586274497534177}, "score": 2.781301458180299}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.953497366381013, "4": 0.04592351425296618, "3": 0.0005420405737549343, "2": 1.73845096196061e-05, "1": 0}, "score": 4.952939324244416}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9973352721072143, "4": 0.0026466277408149696, "3": 1.6699446212826373e-05, "2": 3.62741999703035e-07, "1": 0}, "score": 4.997318882357858}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8785496993411207, "4": 0.11887769351412361, "3": 0.0024778860041530784, "2": 6.666489869573319e-05, "1": 0}, "score": 4.875963059771082}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6442165832646248, "5": 0.2659990078751667, "3": 0.07818483312888988, "2": 0.011177690576391633, "1": 0.00039047434057437684}, "score": 4.164292531133965}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9237417340630795, "4": 0.06378597119728599, "3": 0.007012425724928279, "1": 0.0037870785055603186, "2": 0.0014982118230177767}, "score": 4.9025292115393775}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7691733209664507, "4": 0.22664583003993036, "3": 0.003914562521391308, "2": 0.00014981445443211736, "1": 0}, "score": 4.765048236247982}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6877936867017503, "4": 0.28398777145642184, "3": 0.025821339926579687, "2": 0.002050618139130645, "1": 0.0003022089174871352}, "score": 4.656993637744245}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5271634113722292, "4": 0.45153327954191924, "3": 0.019924538827381325, "2": 0.0012036440684643494, "1": 9.770449419741126e-05}, "score": 4.504577536173844}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4933660576587339, "3": 0.45289101383755404, "2": 0.03867866201993922, "5": 0.014878570838345496, "1": 0.00018220374846437796}, "score": 3.4840818201823955}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8291497341099032, "4": 0.17031609263098305, "3": 0.0005191410183750638, "2": 9.72656262630023e-06, "1": 0}, "score": 4.82861553633359}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9817185349494424, "4": 0.01816802678290162, "3": 9.072224244329822e-05, "2": 1.4997786911116458e-06, "1": 0}, "score": 4.981645639985511}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996672120162093, "4": 0.0003296899139344862, "3": 1.7194243558278137e-06, "1": 1.50538345174063e-07, "2": 0}, "score": 4.999666268674116}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984323268852465, "4": 0.0015572777719794371, "3": 9.227023892128127e-06, "2": 2.724452937168178e-07, "1": 0}, "score": 4.998423449431965}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8108964377497695, "2": 0.16668299567119943, "3": 0.015764317169343477, "5": 0.0035432237584945014, "4": 0.0030410391387943538}, "score": 1.221523589170846}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6285737342580617, "4": 0.3545475533411941, "3": 0.014486320335487421, "2": 0.0015999509603297853, "1": 0.0005237476361790859}, "score": 4.609480032397415}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8163895893714976, "4": 0.17970885676736642, "3": 0.003623227774551383, "2": 0.00013622726509935316, "1": 0}, "score": 4.812609377901676}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6366952833178663, "4": 0.3141055823722361, "3": 0.0416384025218444, "2": 0.006238702817637979, "1": 0.001303633908381725}, "score": 4.57867921827572}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.971029611767292, "4": 0.028225755563625242, "3": 0.0007157549487026225, "2": 1.0706944589150007e-05, "1": 0}, "score": 4.970310074216217}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7679489341786774, "3": 0.15217379852257507, "1": 0.061182180509925584, "4": 0.016339877279712423, "5": 0.0023325201184655354}, "score": 2.1306718977932064}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9979559171885547, "4": 0.0020310292392661487, "3": 1.1775941072781471e-05, "1": 2.892611279139555e-07, "2": 0}, "score": 4.997944259802245}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9790786721270066, "4": 0.020570680370527946, "3": 0.0003340382668978309, "2": 8.885462888195102e-06, "1": 0}, "score": 4.978734422456525}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989302489919999, "4": 0.0010646406016646042, "3": 4.677087363530331e-06, "1": 1.0889529638469857e-07, "2": 0}, "score": 4.998925569293853}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9944477003100661, "4": 0.005529612158467943, "3": 2.205107950779881e-05, "2": 2.725529308647734e-07, "1": 2.405165343181823e-07}, "score": 4.994424505269668}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7754338963789755, "3": 0.17099875554851884, "1": 0.03478910555427641, "4": 0.015908123313514443, "5": 0.002851407919045716}, "score": 2.1765834244813083}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6673171892505187, "4": 0.31748709726836266, "3": 0.014459730500668396, "2": 0.0006313118512477445, "1": 7.017608320975334e-05}, "score": 4.651406777104462}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.99104503667361, "4": 0.008830529501229594, "3": 9.533409941720608e-05, "2": 2.1393896069791743e-06, "1": 0}, "score": 4.990972140736995}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9923462663336827, "4": 0.007493742050547663, "3": 6.87605760358491e-05, "1": 2.7071097638533203e-06, "2": 0}, "score": 4.992357231790447}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951223801113858, "4": 0.004769020219010254, "3": 8.394967884491304e-05, "1": 7.986355778820222e-06, "2": 0}, "score": 4.995031052199453}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7706847065336854, "2": 0.1381131917441058, "4": 0.09002963365622883, "5": 0.0010609569448042687, "1": 0.00011152096029750832}, "score": 2.953815314335553}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9985438024860197, "4": 0.0014475569580991376, "3": 8.018830256722268e-06, "1": 2.8671160127988286e-07, "2": 2.254800842693411e-07}, "score": 4.998534581934217}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7180469658685499, "4": 0.2790785766708197, "3": 0.0028373663460433034, "2": 3.394445655205125e-05, "1": 2.7645518933821563e-06}, "score": 4.715133690210697}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9425438835011154, "4": 0.04432373352083781, "3": 0.010398294257379911, "1": 0.0014658680300492675, "2": 0.0012636958970250443}, "score": 4.9252247798106925}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9981075480495967, "4": 0.0018737734380374032, "3": 1.7000615647584432e-05, "1": 4.615520522913691e-07, "2": 0}, "score": 4.998090376799699}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5826775926050951, "4": 0.4043625509924746, "3": 0.012279358463669636, "2": 0.000609089462735357, "1": 6.227166817835061e-05}, "score": 4.568998439040822}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.38545831273396414, "2": 0.29921658597793904, "4": 0.28865476203549556, "5": 0.022196554607693066, "1": 0.004383165932762656}, "score": 3.025067224967061}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6708346470661283, "5": 0.3023653876672457, "3": 0.025929447163553873, "2": 0.000682164995837846, "1": 0}, "score": 4.275123430865093}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9793786216099409, "4": 0.020537023445549186, "3": 7.816590522902483e-05, "2": 1.9636658499637973e-06, "1": 0}, "score": 4.979300666284029}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8510574618077578, "4": 0.14358828592985626, "3": 0.0049750492943928274, "2": 0.0003168265800089935, "1": 4.461216403112998e-05}, "score": 4.845329939491613}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7828222267162022, "2": 0.21705042047759712, "3": 0.00012484320100875966, "5": 3.078442080381191e-07, "4": 0}, "score": 1.2173018167031087}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3963493736481825, "3": 0.3699127692215617, "1": 0.1631524074498311, "4": 0.05203496409025897, "5": 0.0185436605066903}, "score": 2.366463772618158}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9901594918008769, "4": 0.009684529147309, "3": 0.00015218540662775582, "2": 1.4920224639937057e-06, "1": 0}, "score": 4.990006600971009}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7859478793587722, "4": 0.209663565918738, "3": 0.004271474479455302, "2": 9.861945533984116e-05, "1": 9.714256589380325e-06}, "score": 4.781456858235586}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990789587191455, "4": 0.0009187710464490118, "3": 2.1623326249562174e-06, "2": 2.4420961391927344e-08, "1": 0}, "score": 4.999076830948351}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9489530573312839, "1": 0.04443521470118283, "3": 0.0065965466614342156, "4": 1.0971440276478494e-05, "5": 2.2274480499630245e-06}, "score": 1.9621898822295047}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5600679854681206, "4": 0.2795418125223759, "2": 0.08537130002083684, "5": 0.07215372980134975, "1": 0.002720844415439846}, "score": 3.3330843565963937}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.609741001306456, "4": 0.18368361225901877, "2": 0.17403556571389617, "5": 0.028978885511187224, "1": 0.003289578953678527}, "score": 3.061043224120877}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4735428377572266, "4": 0.28052472829237096, "2": 0.12753088607429086, "5": 0.10953830210225263, "1": 0.00882588586409558}, "score": 3.3544319162388017}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6331861020300713, "4": 0.31412735064335645, "3": 0.0523432704037758, "2": 0.00030426637703065385, "1": 0}, "score": 4.5802569350119535}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.729277617391303, "3": 0.25033130961833666, "5": 0.01337908516417053, "2": 0.00698950877918859, "1": 1.232889331858446e-05}, "score": 3.749029223915554}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5833734101373712, "3": 0.2540992856384985, "5": 0.07917222785921618, "2": 0.07423737866931042, "1": 0.00900070834268676}, "score": 3.6495550615274515}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5365788964685563, "5": 0.45945949097286976, "3": 0.003936286550412103, "2": 2.003347366915234e-05, "1": 0}, "score": 4.4554855481480935}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7206705506748875, "5": 0.2613852255123801, "3": 0.016545518488857713, "2": 0.0012263021744725433, "1": 0}, "score": 4.242428898180129}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7469936235226572, "4": 0.2514065070266636, "3": 0.0015437372758288932, "2": 4.293526679204186e-05, "1": 0}, "score": 4.745373852343442}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8090874753651462, "3": 0.12663247317385057, "1": 0.05846049804034319, "4": 0.005100266937170053, "5": 0.0006753543782795405}, "score": 2.080402104376395}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.49920317588402036, "5": 0.48689843013637707, "3": 0.01380897687655781, "2": 8.148154541368549e-05, "1": 0}, "score": 4.472930243134193}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5634623118459402, "3": 0.4062408778960569, "5": 0.023593703580117326, "2": 0.00667353216000812, "1": 2.867476758859983e-05}, "score": 3.603919380687626}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9144163829957672, "4": 0.08252476903289191, "3": 0.0029588863930450175, "2": 8.737913795170546e-05, "1": 1.0318150800135244e-05}, "score": 4.911253847216976}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9682500296161299, "4": 0.03146007491742328, "3": 0.0002854119450737735, "2": 3.2237412306087503e-06, "1": 0}, "score": 4.967959389604612}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5329709282099542, "5": 0.4450175586294756, "3": 0.020933465091834216, "2": 0.0009493053987570929, "1": 0}, "score": 4.422239843024888}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9892626948463544, "4": 0.010549410472555478, "3": 0.00015831054171852612, "2": 7.822393312805421e-06, "1": 0}, "score": 4.989110264284405}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9824740576645452, "4": 0.0174739688457421, "3": 4.9739608029902075e-05, "2": 3.678090203232931e-07, "1": 0}, "score": 4.982425415715685}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9250843559556968, "4": 0.07342902393957927, "3": 0.0014340404921496333, "2": 4.6848526556931185e-05, "1": 4.745275815422736e-06}, "score": 4.923543293021386}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989256087719847, "4": 0.0010685072478792013, "3": 4.721863627308382e-06, "2": 1.4674227795963203e-07, "1": 0}, "score": 4.9989216077030605}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6807408558382084, "4": 0.2669915684284967, "3": 0.04177729787621207, "2": 0.00988027730804854, "1": 0.0005940611486765934}, "score": 4.6174306613743745}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9374926698451298, "4": 0.058061516569397634, "3": 0.0034872249581195205, "2": 0.0007804311769903782, "1": 0.00016817944896914318}, "score": 4.931949343177967}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9453757324824525, "4": 0.05371749709992068, "3": 0.0008273790703021636, "2": 5.796651741846759e-05, "1": 0}, "score": 4.9444526551148025}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9010398173075773, "4": 0.09769893702327581, "3": 0.0012220946087425743, "2": 3.0295693023238623e-05, "1": 0}, "score": 4.899765099063297}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9890488967351729, "4": 0.010860846727220026, "3": 8.314042602207305e-05, "2": 2.5712407331783312e-06, "1": 0}, "score": 4.988965108546379}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9157638657717053, "1": 0.06674664801275994, "3": 0.016569990845801064, "4": 0.0008201687878880718, "5": 9.4770156795405e-05}, "score": 1.9517477710215387}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6978001257641309, "3": 0.2914478475012277, "1": 0.006531866120676442, "4": 0.0037829290063582568, "5": 0.0004286610691030727}, "score": 2.2937703403705907}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5882587363860203, "5": 0.3944767404513675, "3": 0.017107190616014446, "2": 0.00014256136776166867, "1": 0}, "score": 4.3770899971636155}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9756294651652927, "4": 0.024233546178319115, "3": 0.00013434223787122648, "2": 1.4009962041489173e-06, "1": 0}, "score": 4.975493535836429}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5121022637500346, "5": 0.47984665253896847, "3": 0.007936913557598893, "2": 9.99307611787602e-05, "1": 8.900776836814142e-06}, "score": 4.471685693276999}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6990856304717005, "1": 0.29969850290019723, "3": 0.001170837469883547, "4": 1.0988613034667292e-05, "5": 0}, "score": 1.7014841501534812}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5301510198029972, "4": 0.3012148444223735, "2": 0.09593730248413787, "3": 0.05822233121416787, "1": 0.014259969540615307}, "score": 4.2373250889518275}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8895314994216454, "4": 0.10830728070953334, "3": 0.0021007412927368995, "2": 3.79649573007535e-05, "1": 0}, "score": 4.887374806232413}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943381967642909, "4": 0.00564354028665565, "3": 1.611189079304186e-05, "2": 3.641940525361499e-07, "1": 0}, "score": 4.99432313320581}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6234315146944777, "4": 0.3665076810612036, "3": 0.00986217447196246, "2": 0.0001880787123584089, "1": 6.176597527516859e-06}, "score": 4.613177335326456}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7183639817595443, "4": 0.18981275362310862, "3": 0.04381572095872394, "2": 0.039848281455832094, "1": 0.008048399718874076}, "score": 4.570769775687612}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9664052879635205, "4": 0.03334013674960781, "3": 0.000246855601894646, "2": 3.690553910244583e-06, "1": 0}, "score": 4.966154944018705}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.973195354025109, "4": 0.02662480443882979, "3": 0.00016123655267974896, "2": 8.366214883003355e-06, "1": 0}, "score": 4.973027347644418}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9679021417977142, "4": 0.03156613532390291, "3": 0.00043508462742176897, "2": 6.195520091393614e-05, "1": 2.1543595029496263e-05}, "score": 4.967291225662925}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9745068215575168, "4": 0.02528616173211044, "3": 0.00018430381381253003, "2": 8.001728316941082e-06, "1": 0}, "score": 4.974320847684983}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8387571719271384, "2": 0.1589435613242565, "3": 0.0020882633321160434, "4": 5.2435956983028705e-05, "5": 0}, "score": 1.1633032904473328}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.26630028924516436, "4": 0.25652965680058487, "5": 0.22054174109333755, "2": 0.19797005442566196, "1": 0.05806033793257447}, "score": 3.383751861802561}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5525978263482079, "5": 0.27838136188920215, "3": 0.1482586641468815, "2": 0.020137319377081804, "1": 0.00054613814576525}, "score": 4.088216586322232}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7104735922324318, "4": 0.2574588699463421, "3": 0.029410503692214634, "2": 0.002332746383890723, "1": 0.0003103539927108996}, "score": 4.6754759457088895}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.32812983844756705, "4": 0.2957346734857099, "5": 0.22669748851085564, "2": 0.1237514698534796, "1": 0.025643332055767198}, "score": 3.574116317016189}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6356706726822968, "3": 0.21798646615020528, "4": 0.09200510631954892, "1": 0.03313778854162996, "5": 0.021195205045184712}, "score": 2.432446564374247}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8118440450606966, "3": 0.09340272113163976, "1": 0.04399166917157717, "4": 0.04081793544194136, "5": 0.009938358627170997}, "score": 2.160862846563865}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5025906084401377, "5": 0.3949298202971582, "3": 0.09830075217767005, "2": 0.00405674520713375, "1": 0.00011802925977992587}, "score": 4.288162655433779}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8932812259562564, "4": 0.0930606451467942, "3": 0.01205768937683716, "2": 0.0013540821963770606, "1": 0.00024348627074709958}, "score": 4.877787433548657}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8230790268590221, "3": 0.1426708428762217, "1": 0.01950093238383255, "4": 0.013318176801535131, "5": 0.0014206786485826703}, "score": 2.154069893498421}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8197439447401011, "3": 0.15008930430653267, "5": 0.0260508312891544, "2": 0.004072164511039581, "1": 3.472353009838244e-05}, "score": 3.8677118325933826}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9888663114269957, "4": 0.010963354245355564, "3": 0.00015149347549224616, "2": 9.32812992461087e-06, "1": 5.42957334918255e-06}, "score": 4.988683909915209}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9892727270102109, "4": 0.010640396826930115, "3": 8.421478991027425e-05, "2": 1.086973857774358e-06, "1": 0}, "score": 4.989187895649108}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.984314158614555, "4": 0.015619861522606557, "3": 6.157706981423081e-05, "2": 1.2573087927662753e-06, "1": 0}, "score": 4.984253162879959}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8027571573609529, "4": 0.19391479837930645, "3": 0.003099284501805513, "2": 0.00011684970752240974, "1": 0}, "score": 4.79951364705665}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"1": 0.988928092779677, "2": 0.011053509495945562, "3": 6.715320501095006e-06, "5": 2.4230538133048555e-07, "4": 0}, "score": 1.011068035977895}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6644209961975985, "1": 0.310308597764988, "3": 0.022095343367793514, "5": 0.0016670671401329044, "4": 0.0014997632749925007}, "score": 1.719785166773369}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9413153456014673, "4": 0.05520959049162293, "3": 0.0030867608700599525, "2": 0.00023781892338055723, "1": 0.00012932356994171663}, "score": 4.937384811746932}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9489124857106437, "4": 0.04997973778438288, "3": 0.001034847713298669, "2": 4.913784726656784e-05, "1": 1.4562308164184604e-05}, "score": 4.94774442176684}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9881987030580067, "4": 0.010689368816308649, "3": 0.0009093304486316146, "1": 0.00010216657382337561, "2": 8.705120928524361e-05}, "score": 4.986821974042689}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.769021924099944, "1": 0.1584368480621831, "3": 0.06602628227070143, "4": 0.004327613688873292, "5": 0.0021323647581498323}, "score": 1.9226375034670726}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9891563093213458, "4": 0.010674388552097095, "3": 0.0001454321359133229, "2": 7.8090596866308e-06, "1": 0}, "score": 4.98901114350575}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5415204217260763, "3": 0.34692491698955236, "5": 0.07491952061888986, "2": 0.03601444755721587, "1": 0.0005368504467045506}, "score": 3.6543261749612683}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8378409446795826, "4": 0.15873724355453522, "3": 0.003219194841232621, "2": 0.0001515142315201441, "1": 0}, "score": 4.834361359487823}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4629622785635029, "3": 0.3110791492457035, "1": 0.14737901162046138, "4": 0.04803083876988237, "5": 0.03001373406238146}, "score": 2.3499902578485434}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5523689545821469, "3": 0.20705581176606044, "4": 0.1827874639989342, "1": 0.03250083167415055, "2": 0.025278190262084596}, "score": 4.197255992808993}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.893854802777144, "4": 0.10373579965854487, "3": 0.002376551004776941, "2": 2.7297921341752667e-05, "1": 5.41612469050622e-06}, "score": 4.8914075256791465}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.48651674433187775, "4": 0.3046454919102824, "5": 0.10492602509733592, "2": 0.09763853867771385, "1": 0.006196463827784911}, "score": 3.4044971153250105}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8271471396616107, "5": 0.10367426109532496, "3": 0.06860440729714064, "2": 0.0005366595766244142, "1": 3.739496456154727e-05}, "score": 4.033884354407121}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7246105941070782, "4": 0.2320017881041626, "3": 0.04278728499873677, "2": 0.0005305190982961466, "1": 6.918517170651599e-05}, "score": 4.680555143139162}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7554116247162803, "4": 0.23185813069190442, "3": 0.01143048579875846, "2": 0.0010276317458582094, "1": 0}, "score": 4.742127828480413}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9751010873746575, "4": 0.024675572310261407, "3": 0.00016173570590797542, "2": 4.952941081236472e-06, "1": 0}, "score": 4.97498468029509}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7044500651495477, "4": 0.29180310561283557, "3": 0.0034895586921634973, "2": 9.892189090464244e-05, "1": 0}, "score": 4.700873645074281}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991421483652828, "4": 0.000854378716954613, "3": 2.7556285295010293e-06, "2": 5.734558383986763e-08, "1": 0}, "score": 4.999139937421643}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9859292495246619, "4": 0.01381618289932191, "3": 0.00023391283780740585, "2": 1.1434442334246433e-05, "1": 0}, "score": 4.985681556077771}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4263054802116621, "3": 0.389292184634027, "5": 0.13435012681579744, "2": 0.04907988511069752, "1": 0.0009448286213365554}, "score": 3.644053899498405}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996435060090888, "4": 0.000349157446985326, "3": 5.147790317120476e-06, "1": 5.275057875487389e-07, "2": 0}, "score": 4.999638436348584}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8339448132298751, "4": 0.16138814127148735, "3": 0.004372068678835243, "2": 0.00024450715149715204, "1": 0}, "score": 4.829125575940847}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998322311147737, "4": 0.00016477691980890913, "3": 1.6994498107846052e-06, "1": 1.1592377197459512e-07, "2": 0}, "score": 4.999831360287062}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995034483226098, "4": 0.0004926111684906694, "3": 2.9130206240750693e-06, "1": 7.9503085875136e-08, "2": 0}, "score": 4.9995012443051055}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5460410625115262, "5": 0.41724839210526843, "3": 0.035643007301037206, "2": 0.0010111625201334922, "1": 4.779669801677045e-05}, "score": 4.379442924859169}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9953566452596652, "4": 0.004494009460864144, "3": 6.778246668009548e-05, "1": 3.0032275428163636e-06, "2": 0}, "score": 4.995358048025783}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.990495501994731, "4": 0.009413564480808507, "3": 8.679374509604219e-05, "2": 1.489901570881537e-06, "1": 0}, "score": 4.990408352907594}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9973561415661291, "4": 0.0025435523806190017, "3": 4.318751971235092e-05, "1": 2.7673150606959152e-06, "2": 0}, "score": 4.997358859770523}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976694107501607, "4": 0.0023030015157051846, "3": 1.166512426196797e-05, "1": 0, "2": 0}, "score": 4.9976736311939085}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7219085573356645, "4": 0.24874654313119965, "3": 0.024513999903492397, "2": 0.0037493117094229015, "1": 0.0009389659888678612}, "score": 4.687177042563714}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9932863042364497, "4": 0.0066355255871144245, "3": 7.422979043674438e-05, "2": 1.4079849348022186e-06, "1": 0}, "score": 4.993211773686696}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.967221942807303, "4": 0.03271935107877614, "3": 5.042721744395736e-05, "2": 5.395156739155958e-07, "1": 0}, "score": 4.967177921916753}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.979571325474564, "4": 0.0201168159350337, "3": 0.0002959269276985169, "2": 5.317602574883781e-06, "1": 0}, "score": 4.979275157427119}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.961127590840676, "4": 0.0382905442385122, "3": 0.0005374477564439512, "2": 3.020862736629433e-05, "1": 1.0751857796961164e-05}, "score": 4.960500790399216}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6573204973738866, "1": 0.24634196665555425, "3": 0.0782447300056869, "4": 0.013385356072637558, "5": 0.004243272463496673}, "score": 1.8713435734766435}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6745171684925, "4": 0.27885729931400577, "2": 0.04168080366221113, "5": 0.004864292502118689, "1": 7.574856936680053e-05}, "score": 3.2467547401702235}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9271467959686742, "4": 0.07155377600633056, "3": 0.0012339503368170846, "2": 4.174704030827683e-05, "1": 0}, "score": 4.925851322602957}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9906295518496072, "4": 0.009301071224743237, "3": 6.342642406446287e-05, "2": 2.2407296691152926e-06, "1": 1.8496650302462393e-06}, "score": 4.990557937514755}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8729138768118243, "4": 0.1143252754593333, "3": 0.011625542057426125, "2": 0.0007880647511280417, "1": 0.00033555445658995145}, "score": 4.858715577230792}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6550678113021757, "3": 0.27461265541062807, "4": 0.03571478608119097, "1": 0.031807584860850724, "5": 0.002721772381594748}, "score": 2.3224242674107143}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7681037222043372, "4": 0.18414809149605899, "3": 0.03100933471455845, "2": 0.009394940305456125, "1": 0.007044719147032202}, "score": 4.6973789997479045}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6467560910658546, "5": 0.2987757759881597, "3": 0.05059219315835192, "2": 0.003730816009313377, "1": 0.00011211213300259121}, "score": 4.240393550198789}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9568356163811087, "4": 0.04114747148668726, "3": 0.00159269377208778, "2": 0.000248400300043771, "1": 0.0001469579597769182}, "score": 4.954332790269644}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3622446017115157, "4": 0.3013952960235363, "2": 0.17848669827623942, "5": 0.1335223499230838, "1": 0.02430208572535212}, "score": 3.3413658422614825}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8152866742858133, "1": 0.13456290420718933, "3": 0.04821831745172318, "4": 0.0014231109412257287, "5": 0.0004240331168517437}, "score": 1.9177667479406761}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9199221611169887, "4": 0.07648152275023715, "3": 0.0026723944785946754, "2": 0.0007714690527939661, "1": 0.00012751213773184517}, "score": 4.915347121301219}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8392952645932519, "1": 0.1593890037918921, "3": 0.001266303819809476, "4": 2.98924385755395e-05, "5": 1.570747255382714e-05}, "score": 1.841983602454303}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.733259672455891, "4": 0.1379679040808399, "2": 0.05449796050171715, "3": 0.044071546889799466, "1": 0.029593092688556453}, "score": 4.491712784450761}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4321918033655469, "4": 0.3525079160861437, "2": 0.11057658734070137, "3": 0.09966030756407862, "1": 0.005021268941650818}, "score": 4.09631857091565}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5574581030230735, "3": 0.3577011921149164, "5": 0.04757079292895859, "2": 0.037037009852022164, "1": 0.00022394456822826393}, "score": 3.6151202998404717}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5934717292607326, "5": 0.30917018289130493, "3": 0.091832087995204, "2": 0.005261805816650615, "1": 0.0002542679311140733}, "score": 4.2060537247803635}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8691282423315763, "4": 0.128880688235655, "3": 0.0019206550101528179, "2": 4.4785013258024214e-05, "1": 0}, "score": 4.86714024158713}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8550368342322017, "4": 0.14286865032849652, "3": 0.002081339296355759, "2": 9.032530475025507e-06, "1": 0}, "score": 4.8529409641317125}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99868764888687, "4": 0.0013097316632039295, "3": 2.3974808924538344e-06, "2": 5.1649878177460156e-08, "1": 0}, "score": 4.998685318201461}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6609645443361728, "3": 0.1731571872825155, "1": 0.1316137476659938, "4": 0.023584895335802068, "5": 0.010635172610959642}, "score": 2.1206241101966574}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8729006086217352, "3": 0.11643369612124017, "1": 0.007376002159160898, "4": 0.00306698495287493, "5": 0.00021589896809622044}, "score": 2.115840149548187}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5790104229097064, "3": 0.3585952728982189, "5": 0.03877981110958078, "2": 0.023454884770599288, "1": 0.00015292912181793811}, "score": 3.6328135287964747}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.47795729093067657, "3": 0.24034485287385893, "5": 0.23877394773553912, "2": 0.042167647452925575, "1": 0.0007476978540729784}, "score": 3.9118499515512637}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.582786173036507, "5": 0.2113515538444315, "3": 0.19301638448033961, "2": 0.012479690700022732, "1": 0.0003475803488410864}, "score": 3.9923329041746776}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8207065609863742, "3": 0.17175109025179514, "1": 0.004374942071763458, "4": 0.003004597990932669, "5": 0}, "score": 2.1734135774008454}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5174516438729345, "4": 0.36492781940884966, "3": 0.10518404012773815, "2": 0.010815013189734542, "1": 0.001005807075049807}, "score": 4.387858951714857}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6695758277469953, "4": 0.3187075078824377, "3": 0.011552331510556046, "2": 0.00012397916880249452, "1": 0}, "score": 4.657802082640955}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972754047653408, "4": 0.002714451423422296, "3": 9.499123754312253e-06, "2": 1.5266940576028962e-07, "1": 0}, "score": 4.99726609097572}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.99908645074044, "5": 0.0009054671134174634, "3": 6.540349196240542e-06, "2": 2.9949293769084394e-07, "1": 0}, "score": 4.000898328894343}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9401259362103813, "1": 0.03057384726500783, "3": 0.028969492079262086, "4": 0.0002765740391920943, "5": 4.1332414959333066e-05}, "score": 1.9990727782523963}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4887596615503449, "3": 0.3692970297776973, "4": 0.12897324490097917, "5": 0.011052705935014995, "1": 0.0018290583635409367}, "score": 2.658630735767649}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.4837978619987686, "3": 0.3482247062403143, "5": 0.14636492346213362, "2": 0.021222362889343944, "1": 0.0002969638926860108}, "score": 3.754781749956599}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6116047551639793, "4": 0.35195941793071467, "3": 0.03487869830064448, "2": 0.0015095933032932892, "1": 4.428435958608091e-05}, "score": 4.57357588183979}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4471467940309279, "4": 0.25844538085232427, "2": 0.20819973408739395, "5": 0.07916824559630962, "1": 0.005636418685504807}, "score": 3.197586598904398}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7450193781509379, "3": 0.21794158735725522, "4": 0.01813109244183658, "1": 0.015878749073103462, "5": 0.0029523878363389316}, "score": 2.247201172997673}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.44445198060448277, "3": 0.32911521235168634, "5": 0.14353892876213686, "2": 0.08049700501760354, "1": 0.0022065280872791983}, "score": 3.646742881324692}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.786264507207022, "4": 0.20327573928980047, "3": 0.010083068983796963, "2": 0.00030991484244898346, "1": 0}, "score": 4.775613395994202}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.47616419821526496, "5": 0.28269754455835255, "3": 0.19044106544923456, "2": 0.04806176617371559, "1": 0.0025282017492693058}, "score": 3.9885471134912467}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7167428140572454, "4": 0.26025681121863653, "3": 0.022154443347789467, "2": 0.0008097261126567596, "1": 2.768438561269682e-05}, "score": 4.692891769373579}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9988961150297694, "2": 0.0010912319408463496, "3": 6.829927495711002e-06, "5": 1.0271793576072217e-06, "4": 0}, "score": 1.0011090058319743}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6000766031492136, "2": 0.29993916746627663, "3": 0.06751950904323321, "4": 0.027582761078695162, "5": 0.004827787455584391}, "score": 1.5370667124854593}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5537588642920688, "4": 0.40623120947821756, "3": 0.03949669426780003, "2": 0.00031193772170480527, "1": 0}, "score": 4.5137417078276005}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5423392504561381, "4": 0.4378823114633032, "3": 0.018156348496651622, "2": 0.0013505747991513777, "1": 0.00021898134815867944}, "score": 4.520852170471183}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.643829718569502, "2": 0.264133981207196, "3": 0.08002567166274366, "4": 0.00859732646686972, "5": 0.0027294995543885865}, "score": 1.4612106791844253}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6851442903878788, "3": 0.2291289576695821, "5": 0.06538947932824435, "2": 0.02020034692939373, "1": 0.0001261990671150217}, "score": 3.7954790367803284}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9935527823714322, "4": 0.006278945039212723, "3": 0.0001379435519953697, "1": 1.2595008163574086e-05, "2": 9.72634864427625e-06}, "score": 4.993365555651699}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9955822779686809, "4": 0.004137531189746736, "3": 0.00021399594322813072, "1": 4.246272184495841e-05, "2": 2.0647836789519343e-05}, "score": 4.995202667729446}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9751896198461056, "4": 0.024566513578853737, "3": 0.00022473738842052464, "2": 1.0420192997266247e-05, "1": 0}, "score": 4.974952532927083}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9930833479111326, "4": 0.006748635113171855, "3": 0.00015054899177552593, "2": 1.0562939042404767e-05, "1": 0}, "score": 4.992918529188277}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6721952500439611, "3": 0.2720310676247547, "4": 0.03349332880940111, "1": 0.018550970003537743, "5": 0.003717588773584326}, "score": 2.3316234329745207}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.527917926285201, "5": 0.43015145989491993, "3": 0.037430185543432755, "2": 0.004249499787633763, "1": 0.000213338383052546}, "score": 4.383596679066797}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.68871498381736, "5": 0.2807197888164382, "3": 0.02982852883426587, "2": 0.0007032894608825234, "1": 1.7190683119582998e-05}, "score": 4.249437154479586}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6257990286010489, "5": 0.30491735692283584, "3": 0.0675764992909684, "2": 0.0016591653570770324, "1": 3.934695376293558e-05}, "score": 4.233906498324629}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5086568575344871, "4": 0.4672971164294579, "3": 0.02252445209702501, "2": 0.0013465230868999636, "1": 0.00013878535874521736}, "score": 4.483040520890241}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6163227733306372, "2": 0.1482660179589962, "4": 0.14662616890040517, "3": 0.07580287941879181, "1": 0.012952052618990198}, "score": 4.20513787638133}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6669695741993356, "4": 0.27286994206644677, "3": 0.04047703511062294, "2": 0.01746063605442929, "1": 0.00220324721505962}, "score": 4.5849729705379865}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.959460054480761, "4": 0.03953794244095329, "3": 0.0009707884321246837, "2": 2.5733832297253197e-05, "1": 0}, "score": 4.958443051432006}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.983928320109908, "4": 0.01580998937190113, "3": 0.00023619920972360112, "2": 1.740886497784625e-05, "1": 6.659987168936126e-06}, "score": 4.983638722391839}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969590631433952, "4": 0.002987462243390558, "3": 4.4340037856448816e-05, "1": 3.425808690863184e-06, "2": 0}, "score": 4.996910136806825}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9474807811291321, "4": 0.05032317864319735, "3": 0.0020710689583417884, "2": 9.034544113768629e-05, "1": 1.745485019148686e-05}, "score": 4.945192886624202}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.40095974630243714, "4": 0.3389169116570441, "3": 0.21681665292107122, "2": 0.04088194319876656, "1": 0.0024016379385791795}, "score": 4.09517649250478}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7680139591677284, "4": 0.22036055230606477, "3": 0.01094222631945229, "2": 0.0005574940094884106, "1": 8.152580190739577e-05}, "score": 4.755745603419355}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974527916547152, "4": 0.0025082135808720887, "3": 3.592209471900314e-05, "2": 1.1764936807754572e-06, "1": 9.821556874174182e-07}, "score": 4.997412481760854}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.42430811556775994, "5": 0.36309059603578586, "3": 0.1914722096908626, "2": 0.01916628180093048, "1": 0.0019305217033048934}, "score": 4.127498372668798}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7634571568830505, "1": 0.1900554513862666, "3": 0.04434159958521688, "4": 0.0016287104699439098, "5": 0.00040349337065205754}, "score": 1.8587380035400738}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6922976886205728, "4": 0.2753575621162383, "3": 0.03165387515911906, "2": 0.0006431178300811319, "1": 2.9110372616403035e-05}, "score": 4.659282539600652}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7987212321712653, "4": 0.19684513030469658, "3": 0.004369103236376771, "2": 4.536752578223199e-05, "1": 9.587963962535528e-06}, "score": 4.7942402378581725}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8653423067361885, "4": 0.13279011233771856, "3": 0.0018394125953266718, "2": 2.363606108686821e-05, "1": 3.5238972765107724e-06}, "score": 4.8634459210018965}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6507365719822245, "5": 0.3056778222955959, "3": 0.0432148972252384, "2": 0.00035489769255836733, "1": 1.4920641024544934e-05}, "score": 4.261708600725575}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5051869298902031, "4": 0.31256444720887006, "3": 0.16339413348260343, "2": 0.01750870137846167, "1": 0.0011952263467840416}, "score": 4.303235370241068}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9826136457042316, "4": 0.01693555535369026, "3": 0.00044018784574921294, "2": 7.341150380718613e-06, "1": 0}, "score": 4.982161987174332}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991640376114125, "4": 0.0008324464187856711, "3": 3.0905731463470166e-06, "2": 4.8866829694053495e-08, "1": 0}, "score": 4.999161225518609}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5395367381170034, "5": 0.35699378725535147, "3": 0.10014596572581866, "2": 0.003241120096905527, "1": 7.067172459953379e-05}, "score": 4.250156497265694}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987554238281279, "4": 0.0012210361224195253, "3": 2.074947734079961e-05, "2": 5.289102918988452e-07, "1": 0}, "score": 4.998735875333001}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5514758946209752, "2": 0.25325431436660883, "5": 0.10589801189175088, "4": 0.08215991072185683, "1": 0.007191606477564305}, "score": 3.02631894045592}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9499738795272739, "1": 0.031924804525851766, "3": 0.01794597182670926, "4": 0.00013183901012303858, "5": 2.1061201533777043e-05}, "score": 1.9863479955614551}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.821398552250656, "4": 0.17572175015787303, "3": 0.002779838073273323, "2": 8.601782635442247e-05, "1": 7.056206315233269e-06}, "score": 4.818431063357864}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6941940823551224, "4": 0.21129041868353174, "3": 0.08457572433007365, "2": 0.009772870974045136, "1": 0.00014179715606875312}, "score": 4.589662028959166}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4982843704152304, "5": 0.40404977627865996, "3": 0.08179449793859618, "2": 0.015493967877445268, "1": 0.0003661423008461494}, "score": 4.290172178723691}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.684302956882896, "3": 0.18726510355459772, "1": 0.06732400630948554, "4": 0.04741147457198011, "5": 0.013575377568926697}, "score": 2.255521117876974}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.31435376095401485, "5": 0.2544083311045244, "2": 0.18046619573410874, "3": 0.1618623655873605, "1": 0.08765209202141111}, "score": 3.467988423984269}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.77143996974413, "4": 0.2238886161784116, "3": 0.004488074549717858, "2": 0.00012607040969300437, "1": 0}, "score": 4.766743665108495}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9938767400386047, "4": 0.00606070590325016, "3": 5.333696179801303e-05, "2": 2.899903782414564e-06, "1": 0}, "score": 4.993823881446077}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8233115877637439, "5": 0.10919860396023325, "3": 0.05690642652654877, "2": 0.009920539242894594, "1": 0.0005704439161386382}, "score": 4.030742607773104}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6091814976348993, "2": 0.38992001524791586, "3": 0.000865983848732608, "4": 6.511126989891258e-06, "5": 0}, "score": 1.3916816969724266}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8309153454614792, "5": 0.13319683265832144, "3": 0.03459338500580246, "2": 0.0012320959936284054, "1": 5.8911514149649856e-05}, "score": 4.095962850214609}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9687673023342618, "4": 0.0309312400792386, "3": 0.00028747490169206045, "2": 8.76167466047303e-06, "1": 2.4432241938639153e-06}, "score": 4.968457664578764}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8930394876413627, "4": 0.105916789273825, "3": 0.001004303512610653, "2": 3.140639573384371e-05, "1": 5.822615491527032e-06}, "score": 4.8919568573766945}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4583648482936552, "3": 0.4517709840533975, "4": 0.08197629982651575, "1": 0.0050624663170187965, "5": 0.002824827438404614}, "score": 2.619135955132626}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8405942388929303, "1": 0.0862897896650955, "3": 0.07042915274803008, "4": 0.002208762223986026, "5": 0.0004761592027943592}, "score": 1.9899853461388157}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5801176042776326, "4": 0.37928028840017425, "3": 0.03930191631892159, "2": 0.0011564630808219023, "1": 0}, "score": 4.53858017080609}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9396593152472109, "4": 0.059392085632540254, "3": 0.0008783986711653973, "2": 2.2985039734343665e-05, "1": 0}, "score": 4.938779271344162}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9928728239468825, "4": 0.007026953669540118, "3": 8.992918775931195e-05, "2": 4.2627886464719386e-06, "1": 0}, "score": 4.992780356051609}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9894610708074535, "4": 0.010239344244954447, "3": 0.00025212892352159384, "2": 2.571304775884134e-05, "1": 0}, "score": 4.98917902348449}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.452804234647586, "1": 0.21634065654530002, "3": 0.12548020022353382, "2": 0.10282773156859212, "4": 0.1023454114325004}, "score": 3.4725401784128263}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6878047327570584, "4": 0.22200099836063328, "3": 0.055923958216765796, "2": 0.022594546661154295, "1": 0.011634028311298615}, "score": 4.551812626566515}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8125144096350991, "4": 0.18043129694667528, "3": 0.006704685960230678, "2": 0.00031056867671529914, "1": 2.8832826813808633e-05}, "score": 4.805110304760108}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9732510243379614, "4": 0.025247654971235402, "3": 0.0013519034724865727, "1": 7.318207822246066e-05, "2": 6.563627777551149e-05}, "score": 4.971558599491086}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9860946392237756, "4": 0.012747233644215957, "3": 0.0009696300024568626, "1": 0.00010089552322733187, "2": 5.082887293376824e-05}, "score": 4.984756877107865}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5535067841988884, "4": 0.3777505204753721, "2": 0.05936185681714259, "5": 0.009139117973298291, "1": 0.0002394380113201429}, "score": 3.3361887909411627}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9582001519064431, "4": 0.04160774712862132, "3": 0.00017737294644999885, "2": 9.191048837319831e-06, "1": 0}, "score": 4.958009701332957}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984493244417063, "4": 0.0015412609482862514, "3": 6.4072269098924664e-06, "2": 1.8325595502167801e-07, "1": 0}, "score": 4.9984453704395575}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996933056203395, "4": 0.000304798090175447, "3": 1.6056321756862424e-06, "2": 3.3264435955210995e-08, "1": 0}, "score": 4.99969189077286}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6483105069543514, "4": 0.33845369184204954, "3": 0.013041652565892953, "2": 0.00018879647027593823, "1": 4.346241975197195e-06}, "score": 4.634878861362788}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5034380767437894, "2": 0.48605771839678724, "3": 0.009352304457561035, "4": 0.0006660458806045876, "5": 0.0004565994629787091}, "score": 1.5086017419792401}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9179069271944734, "4": 0.07993275182499138, "3": 0.0019891014000350104, "2": 0.00012821064276958226, "1": 2.4371820271250352e-05}, "score": 4.9156053532926}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9844211160644525, "4": 0.015404555524922928, "3": 0.00016787397648953658, "2": 1.6689481170783967e-06, "1": 0}, "score": 4.9842546143284245}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990722932562269, "4": 0.0009153244183087708, "3": 9.198786360022519e-06, "2": 4.857838816071997e-07, "1": 0}, "score": 4.999064818134435}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6919966668962387, "5": 0.2832953460270947, "3": 0.02382174642862867, "2": 0.0008631362498725585, "1": 1.673922148929856e-05}, "score": 4.257698749732325}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6253351205911301, "5": 0.19953961319144156, "3": 0.1685614175089547, "2": 0.006441666493880306, "1": 0.0001157370211012185}, "score": 4.017747766019209}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8297819114561361, "4": 0.16714733667251294, "3": 0.002946819576115992, "2": 7.276649079541149e-05, "1": 0}, "score": 4.826731859299066}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9723787265907651, "4": 0.02730421481172657, "3": 0.0003107238445192513, "2": 4.362933088771965e-06, "1": 0}, "score": 4.972061193609675}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8257467586991664, "4": 0.1640583535689614, "3": 0.009217503943763286, "2": 0.000900205038528419, "1": 6.666203216671998e-05}, "score": 4.814537424841767}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5177974895380674, "4": 0.4691635268432514, "3": 0.012514784169402576, "2": 0.0004905899065680586, "1": 2.1498121472930496e-05}, "score": 4.504243138292165}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5209176558041366, "4": 0.4501893801366383, "3": 0.026930828706982383, "2": 0.0019098770704801772, "1": 4.788654455513893e-05}, "score": 4.490025555585483}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.34244867038505566, "2": 0.31833572949131417, "3": 0.3003921774131381, "5": 0.030215041973758856, "1": 0.008584506244771108}, "score": 3.0673756209104366}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7396328977470279, "5": 0.16702852045151925, "3": 0.08770579537274664, "2": 0.005476689863690987, "1": 8.227864183002035e-05}, "score": 4.068127538459302}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9947707175507928, "4": 0.005181797371398111, "3": 4.3219447085129546e-05, "2": 1.4050319713896385e-06, "1": 0}, "score": 4.994727533556106}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7668480321775041, "4": 0.22952909084959888, "3": 0.00304901100988576, "2": 0.000495873353266214, "1": 7.358870563876948e-05}, "score": 4.762589866716814}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"2": 0.949882990374687, "3": 0.04344858473796308, "1": 0.006588519594089561, "4": 7.395365091343195e-05, "5": 4.377941155100326e-06}, "score": 2.0370211645294165}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.48029460641082966, "4": 0.3440756957604522, "5": 0.09050791260488887, "2": 0.08082556216978706, "1": 0.004080902965414731}, "score": 3.4361980750777983}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5841236436408633, "4": 0.4037271905641, "3": 0.011799926220854762, "2": 0.00031267038667990866, "1": 0}, "score": 4.571719283956342}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9769909773874114, "4": 0.022834550893518515, "3": 0.00016356305246172198, "2": 3.0138024621621573e-06, "1": 0}, "score": 4.976829098663054}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3734808938755572, "3": 0.3473398442747199, "5": 0.2560913403238129, "2": 0.022081072177248143, "1": 0.001002251209156881}, "score": 3.8615819616016753}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6458246317066437, "2": 0.3523813884573371, "3": 0.0017816328566077901, "4": 3.7224704895822245e-06, "5": 0}, "score": 1.3559588915526573}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7967883131904284, "3": 0.15866768426571698, "1": 0.03867231923949015, "4": 0.005474835770418846, "5": 0.0003874929123685324}, "score": 2.132108751131544}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5341655603314167, "4": 0.4098214917776166, "3": 0.04808471153018402, "2": 0.007008286810707985, "1": 0.000850529381989682}, "score": 4.469545282946314}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4944672493207134, "5": 0.4098808382262052, "3": 0.08301179274608463, "2": 0.011599671502741285, "1": 0.0009792407808143003}, "score": 4.300750388288561}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9064890756414512, "4": 0.07705914770447803, "3": 0.012271779527612482, "2": 0.0030329740687970288, "1": 0.0011153347443263815}, "score": 4.8848333826207435}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6194752377869682, "3": 0.3292902165105567, "2": 0.026487273675549157, "5": 0.024593399132435058, "1": 0.00015158909804102318}, "score": 3.6418730500876}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6746190957370686, "3": 0.28358556068193, "4": 0.03333972333447531, "1": 0.006806399543687769, "5": 0.0016238409162743325}, "score": 2.3483389713247598}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5677081912919528, "5": 0.4184572687502174, "3": 0.01356465182986668, "2": 0.0002573153969521451, "1": 7.33832458182323e-06}, "score": 4.4043580877272746}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9237107014807964, "4": 0.07483843418218683, "3": 0.0013984423065232507, "2": 3.953809185441379e-05, "1": 0}, "score": 4.922245065139394}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7564248649391225, "4": 0.23642155911463594, "3": 0.006725466418422413, "2": 0.00039179022567333537, "1": 2.645821134533956e-05}, "score": 4.7488438278522995}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9064070783484621, "3": 0.07781350319035872, "1": 0.011851095125702081, "4": 0.0034821651817669237, "5": 0.00043238965374272536}, "score": 2.0742249293553563}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5975745100133647, "5": 0.3926576171545491, "3": 0.009350030253671359, "2": 0.000295602178251977, "1": 0}, "score": 4.382763171667647}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5365631963997388, "4": 0.4381498516776086, "3": 0.024409033250775505, "2": 0.0006650462306169944, "1": 0}, "score": 4.510932834207468}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8701281320147501, "4": 0.1293046281441468, "3": 0.0005515176589105118, "2": 9.078750363386354e-06, "1": 0}, "score": 4.8695642337458205}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9300672161653191, "4": 0.06659094977059439, "3": 0.003151910191300929, "2": 0.00014111195154992254, "1": 3.255378218175086e-05}, "score": 4.926550484710995}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.619829362870445, "3": 0.23221799845411847, "2": 0.09391854640223755, "5": 0.053211502159396205, "1": 0.0007620632503604781}, "score": 3.630847877529615}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6602010098182942, "3": 0.20201773265763728, "4": 0.1009716393587859, "1": 0.02705001822331108, "5": 0.009516501378336033}, "score": 2.4055590881186966}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7230174222132073, "4": 0.27317414319487515, "3": 0.0037256572491126266, "2": 5.484689400062576e-05, "1": 0}, "score": 4.71920215881517}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.990184621872592, "4": 0.009587217290736754, "3": 0.00016962999380115037, "2": 1.0838998017879428e-05, "1": 0}, "score": 4.990040530742146}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9407436438521791, "4": 0.05867638106410646, "3": 0.0005539489630052367, "2": 1.0873227312755886e-05, "1": 0}, "score": 4.940182194915122}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6204169853450275, "4": 0.3602208728404948, "3": 0.015515164166352556, "2": 0.0035523081630500363, "1": 0.0002698158145721033}, "score": 4.597002595114647}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9188262671834813, "4": 0.07323437239425529, "3": 0.006232280261919814, "2": 0.0013142370129935713, "1": 0.00024060463265894054}, "score": 4.90938214198418}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9120341722841139, "4": 0.08618524393628203, "3": 0.0016333185722050222, "2": 0.00011586277978073755, "1": 0}, "score": 4.910197710570071}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8446376501360945, "4": 0.15328543613474446, "3": 0.0019336903564837193, "2": 0.00011399203276937451, "1": 0}, "score": 4.842500603135575}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9931930514462648, "4": 0.0067398743275220345, "3": 5.200727215636312e-05, "2": 2.3965005232679827e-06, "1": 0}, "score": 4.993148834819226}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5054348404586058, "5": 0.48158058468135945, "3": 0.012104311107010676, "2": 0.000791563859722122, "1": 7.130058684020394e-05}, "score": 4.467687381530463}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6916227506758396, "3": 0.28893443070076236, "4": 0.016535957942435238, "1": 0.0021770032583830526, "5": 0.0006941787956631492}, "score": 2.321923365497893}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9824122698491106, "4": 0.01747900207351969, "3": 8.558560113545881e-05, "1": 0, "2": 0}, "score": 4.982349418246041}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9499452591453711, "4": 0.04945537654143437, "3": 0.0005819129452669218, "2": 1.1932199162394191e-05, "1": 2.694922799066702e-06}, "score": 4.949334078186324}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9904096693737093, "4": 0.009534628522966644, "3": 5.001978153886746e-05, "2": 1.7294796068406428e-06, "1": 0}, "score": 4.990360105370153}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4954626234723557, "5": 0.47415903342703636, "3": 0.02937023888984367, "2": 0.0009560337903338613, "1": 3.424517085949807e-05}, "score": 4.442781884141537}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8022825230656907, "4": 0.19407129256060032, "3": 0.0034226800309785617, "2": 8.521594446754194e-05, "1": 0}, "score": 4.798799875901148}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.989405510170474, "4": 0.010502846114758099, "3": 6.72683307780033e-05, "2": 4.007936650780939e-06, "1": 0}, "score": 4.989350376508088}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9803555303863184, "4": 0.01943219018739969, "3": 0.00018773146385441227, "2": 7.294856844248236e-06, "1": 0}, "score": 4.980170120187348}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9923978119236532, "4": 0.007468261782652418, "3": 0.00012388646705900462, "2": 6.186135374058075e-06, "1": 2.3291364066819924e-06}, "score": 4.992256078525448}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8882403253056369, "4": 0.10797797584662401, "3": 0.003348787965347103, "2": 0.00021054692669910681, "1": 0.00014599196091470007}, "score": 4.884099988083821}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6664941410664404, "3": 0.17834564245929388, "1": 0.10563727363086246, "4": 0.043743922067534934, "5": 0.005495375272554152}, "score": 2.176732468151044}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998207895501114, "4": 0.0001775589307366225, "3": 9.509465309585499e-07, "1": 0, "2": 0}, "score": 4.999820539050476}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9497141427843537, "4": 0.0484441253404537, "3": 0.0016803896129235704, "2": 0.00010639467811753462, "1": 0}, "score": 4.947873047149218}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3849182903792829, "2": 0.27208354747921876, "4": 0.20123693178935906, "5": 0.08529409953261444, "1": 0.05638929181163121}, "score": 2.986961984885945}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8170310254468619, "2": 0.18203671162886692, "3": 0.0009195138973543684, "5": 7.128811695860348e-06, "4": 4.702698806016497e-06}, "score": 1.1839185315150487}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7689083710168104, "4": 0.1335772388878118, "3": 0.04800867285099386, "2": 0.040196071982877356, "1": 0.009186974622718872}, "score": 4.613021830111395}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9985675829899856, "4": 0.0014115760963983063, "3": 1.7666594817897397e-05, "2": 5.490370013416939e-07, "1": 0}, "score": 4.998551439800083}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9872279616819658, "4": 0.012119058292479138, "3": 0.0004704477298544124, "2": 0.00011544457653619949, "1": 5.9180290633232716e-05}, "score": 4.986356883473701}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.98020626203426, "4": 0.016773466770059312, "3": 0.0027525935573238444, "2": 0.00020160464124166396, "1": 6.390320764201778e-05}, "score": 4.976860869153959}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6116938724688447, "5": 0.33763231535601695, "3": 0.04080536545370279, "2": 0.009263277048526076, "1": 0.0004967406992045156}, "score": 4.276840191205461}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6095937666339428, "5": 0.3325778536428194, "3": 0.04584011948558366, "2": 0.01015688579558568, "1": 0.0017628419992040416}, "score": 4.261153334044396}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8021985926586037, "4": 0.19517458759093406, "3": 0.002369940570234319, "2": 3.9707399589274177e-05, "1": 0}, "score": 4.799922957982349}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.961103478374145, "4": 0.03827301118462678, "3": 0.0005468917897863828, "2": 1.6868442319844016e-05, "1": 0}, "score": 4.9605802445702105}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8470634802262919, "4": 0.15128235312302005, "3": 0.0015922757448410838, "2": 4.368468390584163e-05, "1": 0}, "score": 4.8453992266395876}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5878055400395321, "2": 0.38340465771357707, "4": 0.023887129016049433, "1": 0.003799267477162212, "5": 0.0010999517101555828}, "score": 2.6350825793278054}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5308332485082587, "2": 0.2523686660598469, "4": 0.12084115069998812, "1": 0.048701838405816655, "5": 0.0469816725060896}, "score": 2.8649952393233042}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9326208201617431, "4": 0.06565735178263037, "3": 0.001656104700629289, "2": 3.134543235203758e-05, "1": 0}, "score": 4.930934028174418}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997471559204534, "4": 0.00024870403075209096, "3": 3.4378097154165112e-06, "1": 1.0040407930362345e-07, "2": 0}, "score": 4.999744018579441}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6574643742818177, "3": 0.17833417520315997, "5": 0.15105522206239116, "2": 0.012591528908183339, "1": 0.0005489978679377941}, "score": 3.9458906869252512}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7560833027879517, "3": 0.19733734570666275, "1": 0.0237178962444018, "4": 0.018310958009676047, "5": 0.004543948187622971}, "score": 2.223874676213994}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.45646979847845076, "4": 0.4393546206859471, "2": 0.07356918669093855, "5": 0.02975408040276841, "1": 0.0008439021551548704}, "score": 3.4236093537170587}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7447541388767688, "4": 0.2517063119199874, "3": 0.003466398916883883, "2": 5.5526120960219566e-05, "1": 0}, "score": 4.74118975056872}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5006478446204407, "5": 0.489989635569573, "3": 0.009220192159836148, "2": 0.00013461428730365994, "1": 3.648049196355707e-06}, "score": 4.480491224035073}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5830728519356746, "5": 0.23835924752330434, "3": 0.1734628020479137, "2": 0.005045724641052872, "1": 5.4200956612353915e-05}, "score": 4.054642675984296}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5382137138817171, "3": 0.4494954398773038, "4": 0.011773877178700431, "1": 0.0002876658484140802, "5": 0.00022312977613776885}, "score": 2.4734278403919943}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5169051415162269, "5": 0.46301593900115073, "3": 0.018867166308671444, "2": 0.0011579019213583818, "1": 0}, "score": 4.4418567633899375}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9972176588060352, "4": 0.0027764059817570377, "3": 4.714578695282572e-06, "2": 5.683275527824198e-08, "1": 0}, "score": 4.997213991120227}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7547476681243711, "4": 0.24402280376563162, "3": 0.0012024754163224862, "2": 1.4631468090753715e-05, "1": 0}, "score": 4.75352528947947}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9258259008995074, "4": 0.07321549500645189, "3": 0.0009187633288046363, "2": 3.5639071781177386e-05, "1": 2.1596184400442084e-06}, "score": 4.924831269146649}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5976096245232273, "2": 0.40197367804775797, "3": 0.00030638961937382595, "4": 1.125726447040036e-06, "5": 0}, "score": 1.402633794862334}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.834583667726087, "1": 0.16371419252204497, "3": 0.0016199473990292969, "4": 5.50971312821306e-06, "5": 0}, "score": 1.8379043443804823}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.8561478207133221, "3": 0.09335941099397621, "1": 0.03662434850728918, "4": 0.012472296178927622, "5": 0.001037376862137165}, "score": 2.084822215124478}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6297428358469463, "5": 0.22631102703999212, "3": 0.1334513215794564, "2": 0.010232278464656807, "1": 0.00014480587581544645}, "score": 4.071969203924022}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9443781749517158, "3": 0.03197981680553571, "1": 0.023370395667530523, "4": 0.0002417046576654709, "5": 0}, "score": 2.0090931024090932}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5267258207798485, "3": 0.26695811648078094, "5": 0.15623949884752236, "2": 0.04892748377491712, "1": 0.0010617391582828503}, "score": 3.788222700509701}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5061935059366143, "5": 0.45137427752276377, "3": 0.03819366174660775, "2": 0.003996525181618991, "1": 0}, "score": 4.40528565654328}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.36411322573605587, "2": 0.30222225154633614, "4": 0.2951373906631031, "5": 0.031192275342414283, "1": 0.007109784820293486}, "score": 3.0410893682228473}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9958101386638963, "4": 0.00414182610595863, "3": 4.321713490656182e-05, "2": 8.412230434063625e-07, "1": 0}, "score": 4.995769199129744}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5125561054052229, "4": 0.3161551199255234, "2": 0.12170608259491911, "5": 0.04788156083167851, "1": 0.001684494096036056}, "score": 3.2868479431331767}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9756560153311814, "4": 0.02386896259967506, "3": 0.0004171060716693612, "2": 1.6582444209047012e-05, "1": 0}, "score": 4.975246054755844}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998508202684029, "4": 0.00014729649938281228, "3": 1.0975424652883294e-06, "1": 0, "2": 0}, "score": 4.999850508298232}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9954922515338908, "4": 0.004469101934721258, "3": 3.12287629001848e-05, "1": 0, "2": 0}, "score": 4.99546840692517}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996127775399759, "4": 0.00038235552059040354, "3": 3.3533691536998357e-06, "1": 5.548583394580813e-07, "2": 0}, "score": 4.999608717932618}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999077652424261, "4": 0.0009009372028091946, "3": 1.759504904068915e-05, "1": 1.4418781836900346e-06, "2": 0}, "score": 4.999058102950834}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6415468921090818, "3": 0.31238721092337546, "1": 0.02999118721427288, "4": 0.01430793500727903, "5": 0.0017237105763176785}, "score": 2.3161966421984634}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9541429786165232, "4": 0.044865080677756415, "3": 0.0009399762020394628, "2": 2.720061430975213e-05, "1": 0}, "score": 4.953172205436911}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9341560431071635, "4": 0.06510879103138374, "3": 0.0006966957891079033, "2": 1.531577829253743e-05, "1": 0}, "score": 4.933450329144875}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952089180243925, "4": 0.004769906862279906, "3": 1.804407828258644e-05, "2": 4.160809517764299e-07, "1": 0}, "score": 4.995192743686818}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973346812859741, "4": 0.002647837526107406, "3": 1.0613603824544625e-05, "2": 2.313983853396669e-07, "1": 0}, "score": 4.997330223353954}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7868660172306845, "3": 0.1464145642237951, "4": 0.03239821338961756, "1": 0.03143282656955894, "5": 0.0028757292060680147}, "score": 2.1884077352927656}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9304635743362775, "4": 0.06697057065783145, "3": 0.002333838364701962, "2": 0.00019477412580255226, "1": 2.1535410018635576e-05}, "score": 4.9276901528168935}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9989457143500442, "4": 0.001043644880671728, "3": 6.8535143051539756e-06, "2": 1.2420219431630532e-07, "1": 0}, "score": 4.998942271609621}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5051009341874204, "3": 0.3127473821793388, "2": 0.13413050970410784, "5": 0.04057916992772748, "1": 0.007434507068926665}, "score": 3.4372630283323127}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4977604359547305, "5": 0.4957706789481642, "3": 0.006273878092430827, "2": 0.0001816461489331343, "1": 9.776236147362623e-06}, "score": 4.489105933108136}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5170476874220854, "3": 0.3542420296103853, "4": 0.08920700598925813, "1": 0.03228233184875517, "5": 0.006988739975507861}, "score": 2.5214610156021076}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6147556974592188, "3": 0.24098345483140388, "4": 0.10507685964336327, "1": 0.032306849900969714, "5": 0.006228183884479259}, "score": 2.437798987397497}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9936362211587795, "4": 0.006251153326611308, "3": 6.028784801476919e-05, "1": 1.0644183129986314e-05, "2": 0}, "score": 4.993585426798937}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9932310303848868, "4": 0.006708133054641608, "3": 5.719889373858925e-05, "2": 1.741604052753324e-06, "1": 8.383057049045812e-07}, "score": 4.993168883897243}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9790778712409804, "4": 0.02076809425496067, "3": 0.00012482023197299023, "2": 4.89413504173002e-06, "1": 0}, "score": 4.978967071352262}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"5": 0.325408845858002, "1": 0.21945352502028123, "2": 0.18308770109201622, "4": 0.17610226527339348, "3": 0.09560243390419125}, "score": 3.204995976382434}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3629837904942977, "4": 0.2767514688250187, "3": 0.21621940996183345, "2": 0.12965092920455093, "1": 0.014157900096267995}, "score": 3.844952152798833}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9052502356695445, "4": 0.09404082335298199, "3": 0.0006799891607463933, "2": 1.1387503363619718e-05, "1": 0}, "score": 4.9045633595363745}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974088014655862, "4": 0.0025866189003116154, "3": 4.159590192341688e-06, "2": 1.7068825746373082e-07, "1": 0}, "score": 4.997404549207342}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4781971279192988, "3": 0.39795680887541324, "4": 0.09944964930830873, "1": 0.014649890762961505, "5": 0.009736155030453018}, "score": 2.6114210210968967}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4748345744126713, "3": 0.2688098571662804, "1": 0.24053667650575403, "4": 0.012631512439837235, "5": 0.0030128000001849444}, "score": 2.0625855316900377}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.46987898319320937, "2": 0.37082042618828015, "3": 0.14875208765491382, "4": 0.005775075205856152, "5": 0.004654880685747335}, "score": 1.7043528488265443}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6866459336747547, "4": 0.27075278687144855, "3": 0.03972097473302099, "2": 0.002051343160782855, "1": 0}, "score": 4.643355589673414}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978073087672864, "4": 0.0021259564154533853, "3": 3.470898398689442e-05, "2": 1.968418754915159e-06, "1": 0}, "score": 4.997798654193544}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9842911712101197, "2": 0.015385496485162901, "3": 0.000305635910315037, "5": 8.977177810903102e-06, "4": 0}, "score": 1.0160328168106387}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8797583425156493, "1": 0.11822212603864353, "3": 0.002002675985473677, "4": 1.2066084196186614e-05, "5": 4.53152513834654e-06}, "score": 1.883818246733068}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.725525339732816, "3": 0.20352895483895866, "4": 0.04168915316335929, "5": 0.014665228431924766, "1": 0.014589867471570109}, "score": 2.316313539656702}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.826189428028528, "3": 0.17213708737466682, "4": 0.0011711430983459663, "1": 0.000488356932700378, "5": 1.3676944855334255e-05}, "score": 2.174032101009136}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5069939846788984, "5": 0.4651684085673899, "3": 0.024347361320173826, "2": 0.003250178373476353, "1": 0.0002182247637372736}, "score": 4.433675488677585}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.41964915585527657, "3": 0.3186117188033881, "2": 0.24408035112732687, "5": 0.013007534662429788, "1": 0.004641962730134575}, "score": 3.192301732541376}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"4": 0.41184844057200337, "5": 0.3258536254936601, "3": 0.19011260965381327, "2": 0.06341213703355333, "1": 0.008294604796957783}, "score": 3.984025282162266}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8553042973761824, "4": 0.13894024921931938, "3": 0.005578072457445814, "2": 0.00016213471406350557, "1": 1.2580469326939569e-05}, "score": 4.849366478292922}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5465051761257821, "4": 0.43358960623684106, "3": 0.019448171959360015, "2": 0.00044315391958153213, "1": 1.0689944764135765e-05}, "score": 4.526140311096208}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9261569743186348, "4": 0.0677344951017669, "3": 0.00567372562672078, "2": 0.0003961213318809408, "1": 3.5086223409317436e-05}, "score": 4.919589055485375}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.970931838863239, "4": 0.02847064279415305, "3": 0.0005711932295716247, "2": 1.780669585093705e-05, "1": 0}, "score": 4.970333297945805}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6787471341429971, "2": 0.31658674472154336, "3": 0.0046081859623043064, "4": 4.502169829833746e-05, "5": 8.288815350945332e-06}, "score": 1.325972844515865}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8847412408029794, "3": 0.09702770720284604, "5": 0.011483182560344968, "2": 0.00671923211216061, "1": 1.4482000854403916e-05}, "score": 3.900972163359817}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7001777693261012, "5": 0.20314091057115544, "3": 0.0955327460206786, "2": 0.0011239999185219593, "1": 1.2796933321518033e-05}, "score": 4.1053230143268555}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8165254560675399, "5": 0.14953224855729227, "3": 0.03333900653812919, "2": 0.0005717690539213306, "1": 0}, "score": 4.115053330367341}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9319919795188918, "5": 0.037311973443346795, "3": 0.03050704007112418, "2": 0.00018312400713427413, "1": 3.4677797856834365e-06}, "score": 4.006428297544091}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8771622745782129, "3": 0.06719252988887221, "1": 0.05236834359926963, "4": 0.00286166973809746, "5": 0.0004140830501625237}, "score": 2.021789798866442}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.978844926398269, "4": 0.020698859020760258, "3": 0.0004131724490395538, "2": 3.0373015250066833e-05, "1": 8.792578891924258e-06}, "score": 4.978348422786684}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.38827625316970416, "3": 0.3386172721837755, "5": 0.17229619831967533, "2": 0.09744256027163786, "1": 0.003358510858912381}, "score": 3.6287148552632487}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996041982501873, "4": 0.0003946941092630819, "3": 9.126612999889973e-07, "2": 1.7942026981367077e-08, "1": 0}, "score": 4.999603426671848}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6809676688165199, "4": 0.26067725701381267, "3": 0.04264165442676568, "2": 0.011400916865699549, "1": 0.00429688473103743}, "score": 4.602642938630743}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7730017859371778, "4": 0.20287054758113354, "3": 0.02315174785509439, "2": 0.0008450717694106667, "1": 0.00012484320100875966}, "score": 4.747789854413412}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995660872673711, "4": 0.00043066492776300025, "3": 2.019523430259694e-06, "1": 1.9246779421393468e-07, "2": 0}, "score": 4.999564525703129}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8810774019334366, "4": 0.11470759968268446, "3": 0.004154629601064136, "2": 5.1249586923884755e-05, "1": 8.39923439265833e-06}, "score": 4.876795706714497}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9020284936554406, "4": 0.09614959683883278, "3": 0.0017946066814882667, "2": 2.1985684960633088e-05, "1": 3.5403675801805567e-06}, "score": 4.900180893917225}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9889932741893412, "4": 0.010794602913394336, "3": 0.00020434986675444073, "2": 4.212084087912346e-06, "1": 2.776867678101817e-06}, "score": 4.988772944827224}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7690417266694466, "1": 0.2233914869125359, "3": 0.007495930542730731, "4": 5.145021072338443e-05, "5": 1.777189999529333e-05}, "score": 1.784260307283762}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5780655548762702, "5": 0.31969204689527975, "3": 0.10207239117767457, "2": 0.00016813236531545094, "1": 1.8752717044503762e-06}, "score": 4.217277765044483}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9942461555353274, "4": 0.005654846013133056, "3": 8.195944550916511e-05, "2": 1.791771074817134e-06, "1": 0}, "score": 4.994175770979235}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9853850632941457, "4": 0.013866672218645787, "3": 0.0007324129966733673, "2": 9.616751809916326e-06, "1": 5.831221848838304e-06}, "score": 4.984616320437609}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4506440938106634, "3": 0.2950242861791211, "2": 0.188241625377162, "5": 0.06250880826061166, "1": 0.0035678789193497786}, "score": 3.3802893877992153}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7880141755574178, "3": 0.20386921371021405, "4": 0.006064282774806426, "1": 0.0018896417842819912, "5": 0.00013615018228380145}, "score": 2.214522280583702}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5783107991697594, "3": 0.3361631403828803, "2": 0.05510314976158585, "5": 0.02991994392625829, "1": 0.0004713641124878224}, "score": 3.582123205669911}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6895358285566333, "5": 0.20825008287001878, "3": 0.09341185636447202, "2": 0.008445381120660124, "1": 0}, "score": 4.097982429400783}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4114435702924582, "4": 0.38482724487779724, "2": 0.1642714067205097, "5": 0.03514746791070607, "1": 0.003978256185682222}, "score": 3.2829882289843573}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.682111776095323, "3": 0.18446294053249782, "5": 0.11399579696447336, "2": 0.01891357236664841, "1": 0.00033040710906776584}, "score": 3.8906942133903533}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4928264476903958, "3": 0.3775670538401791, "4": 0.060145310681971216, "1": 0.04299088768705964, "5": 0.026281053464525424}, "score": 2.53381096984087}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9925794671188376, "4": 0.007335307103713825, "3": 6.846170637733414e-05, "2": 6.445811615637664e-06, "1": 0}, "score": 4.992508354747946}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9662595746964764, "4": 0.033452498554354594, "3": 0.0002600311828764703, "2": 5.879798884235475e-06, "1": 0}, "score": 4.96600905134642}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9242007260018716, "4": 0.07375918124890916, "3": 0.001786381345505227, "2": 0.00016640116972575162, "1": 5.850583880936067e-05}, "score": 4.921932580510864}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.970928014370258, "4": 0.028210261055651727, "3": 0.0007600581609851088, "2": 6.553809377674053e-05, "1": 2.4980825684251414e-05}, "score": 4.969972750309736}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8233798842925083, "3": 0.15878684081611055, "1": 0.014974871739384126, "4": 0.002241169166394673, "5": 0.000615725260255366}, "score": 2.1501417097128854}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.45908575330450246, "5": 0.36943990149842476, "3": 0.15545689319093728, "2": 0.015063454506694302, "1": 0.0009440352985368559}, "score": 4.181025796813845}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6791521819179717, "4": 0.18726712602863746, "3": 0.12823452050917913, "2": 0.005040973806435418, "1": 0.0002933603033934218}, "score": 4.539962024650777}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.6352184966893606, "4": 0.21468178865112014, "2": 0.11695889859060503, "5": 0.03216814827510803, "1": 0.0009697095153770501}, "score": 3.1601202412602327}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.8424941082122115, "1": 0.1483837730873672, "3": 0.009075775027486098, "4": 2.2276683710760345e-05, "5": 2.0993199626369004e-05}, "score": 1.8607991070321628}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9898849032060264, "2": 0.009880597434219339, "3": 0.00020697273258875307, "5": 6.195845940913517e-06, "4": 0}, "score": 1.0103195464071473}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5955472489555745, "4": 0.21264803454520556, "3": 0.13220273016502462, "2": 0.05444913041883626, "1": 0.00493088398351551}, "score": 4.339729016308385}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8045931363619804, "4": 0.18564309364382195, "3": 0.009634686647106405, "2": 0.0001133692916590573, "1": 1.009540689928391e-05}, "score": 4.794705890083942}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6535361695582312, "3": 0.22190158637844287, "5": 0.11350216129446485, "2": 0.010935396125946753, "1": 0.0001121568746690283}, "score": 3.869391675548084}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4938816822977128, "4": 0.4934777289011444, "3": 0.01208712309590174, "2": 0.00044008199330157754, "1": 0}, "score": 4.480968929257735}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.658942962380572, "2": 0.33903307838670116, "3": 0.0019671706241442743, "4": 2.4194263460222035e-05, "5": 1.766901530718719e-05}, "score": 1.343115799603073}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9959469339336572, "4": 0.004044098585121542, "3": 7.342251635867789e-06, "2": 1.4439185758399727e-07, "1": 0}, "score": 4.995940777724984}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7253702535034456, "5": 0.19551917940406824, "3": 0.07731749677784154, "2": 0.001744686143435501, "1": 0}, "score": 4.114717860867977}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9192323402747274, "4": 0.08033143219998326, "3": 0.0004336113205066962, "2": 1.9665693106605195e-06, "1": 2.918949090416987e-07}, "score": 4.918794248820844}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9885226659435505, "4": 0.011401686453561282, "3": 7.403919076639705e-05, "2": 8.379210108800617e-07, "1": 4.617935071496589e-07}, "score": 4.9884458706611134}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9530780170387676, "1": 0.03739901544156526, "3": 0.009374834130770442, "4": 0.00012155666807581475, "5": 2.4109177037789165e-05}, "score": 1.9722911911837713}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.998613230554652, "4": 0.0013231627308698912, "3": 5.8273681428966614e-05, "2": 2.8197904056895436e-06, "1": 1.464770475182493e-06}, "score": 4.998545969928645}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.996745952326749, "4": 0.0032186296002481105, "3": 3.0581692878085775e-05, "2": 7.599075924045126e-07, "1": 0}, "score": 4.996717913911886}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997182045118091, "4": 0.00027959539994809254, "3": 1.6969042438972803e-06, "2": 4.0688351068427957e-08, "1": 0}, "score": 4.999716888595573}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995096401657008, "4": 0.0004859593886518837, "3": 3.555577715627337e-06, "1": 2.056251471096831e-07, "2": 0}, "score": 4.99950610663961}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8734139377678615, "1": 0.10729612968857322, "3": 0.01902582142656673, "4": 0.000209668677365372, "5": 5.428986482061528e-05}, "score": 1.9123118853081884}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.477611355984233, "3": 0.46767723022914987, "4": 0.05243811849109768, "1": 0.0011409242493592502, "5": 0.0010641300160417386}, "score": 2.5746441473186756}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5233341284384013, "5": 0.46656429685164785, "3": 0.00964279475530614, "2": 0.000427360345564557, "1": 1.6821428136141472e-05}, "score": 4.4560229742266975}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.41223533139284035, "2": 0.36738824566632233, "4": 0.1917844104645852, "5": 0.018060988468788643, "1": 0.010496273390567577}, "score": 2.8395200181763376}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4810411315280671, "2": 0.24977324317951044, "4": 0.2147216802332647, "5": 0.046492033669549994, "1": 0.007146830551958227}, "score": 3.0436748785943526}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"3": 0.478939372769746, "4": 0.32353855218781324, "2": 0.14835774885595948, "5": 0.04827654727077181, "1": 0.000838646730800659}, "score": 3.270069873534761}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5188476417962304, "4": 0.4724675271587492, "3": 0.008528487061280433, "2": 0.00013996166419934548, "1": 0}, "score": 4.5100475871691055}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5406367864541259, "4": 0.4494166502328074, "3": 0.009718626277238077, "2": 0.0002043719377318617, "1": 0}, "score": 4.530521918102466}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983594894109978, "4": 0.0016283245113004384, "3": 8.64442459782682e-06, "2": 3.3803344386909187e-07, "1": 0}, "score": 4.998353367263987}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9566653951585732, "4": 0.0428814348839831, "3": 0.0004361819871425506, "2": 1.0266822276148577e-05, "1": 0}, "score": 4.956215106390152}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6616183962241438, "5": 0.2904350522428372, "3": 0.040466896883193736, "2": 0.006861309268420811, "1": 0.0004647554057072622}, "score": 4.23488734694759}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6495499763176641, "3": 0.33464292873129553, "4": 0.013121804064538974, "1": 0.002358270895211785, "5": 0.00032218971786680193}, "score": 2.3594965715854976}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6848540356968658, "4": 0.3076041038268346, "3": 0.00726542125115097, "2": 0.00015196580948787793, "1": 0}, "score": 4.6773689972594905}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6582423120836092, "4": 0.3091811586276157, "3": 0.02891596541197628, "2": 0.0030215458732527076, "1": 0.0005541772369992086}, "score": 4.621673466467566}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.464692817137056, "5": 0.4170543624886444, "3": 0.08779581891790143, "2": 0.017042892914719845, "1": 0.013317424345802915}, "score": 4.255245162877218}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6078507403497969, "2": 0.3593115282760958, "4": 0.031281284486553686, "1": 0.000791584282333153, "5": 0.0007646935443641578}, "score": 2.6719159192683444}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.814994935394875, "4": 0.13538655795272084, "3": 0.038518986631181105, "2": 0.009954694798972338, "1": 0.001022539540887901}, "score": 4.753591093943476}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9647792020394632, "4": 0.03486873487988241, "3": 0.00032093209476524135, "2": 4.396296834196289e-06, "1": 0}, "score": 4.964475262297268}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9450533424919899, "4": 0.053541790455183924, "3": 0.0013450124627313491, "2": 4.870957184808476e-05, "1": 7.347598741168877e-06}, "score": 4.94359245130572}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.42224933423651245, "5": 0.30887472654485604, "3": 0.23702221691100683, "2": 0.03082583937407355, "1": 0.0010030515254357655}, "score": 4.0071918548932794}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"2": 0.45050937136862285, "3": 0.3511214865055365, "1": 0.12634286713078585, "4": 0.051885443510978735, "5": 0.020134186253950033}, "score": 2.3889546498517147}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6026949243791868, "4": 0.16972544108095713, "2": 0.16951773946961737, "5": 0.03383642479809449, "1": 0.024221916867411424}, "score": 3.0194367865394756}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6219163380700861, "4": 0.35933736370375136, "5": 0.015584252962818278, "2": 0.0031536934159535216, "1": 7.3661454058435e-06}, "score": 3.387337825722286}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9336897074075505, "4": 0.06290326555560957, "3": 0.003344252761644594, "2": 5.463985480541593e-05, "1": 7.730051755344268e-06}, "score": 4.930213360930137}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5809632367208245, "5": 0.3761268370109948, "3": 0.04221144441662732, "2": 0.0006568578008289475, "1": 3.805481262696172e-05}, "score": 4.332488699286161}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6549645283527313, "3": 0.27825508891250383, "4": 0.05399563872669172, "1": 0.007072317919335897, "5": 0.0057111035944785}, "score": 2.396307883344887}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9967329265370589, "4": 0.0031972145543666453, "3": 6.335308212831198e-05, "2": 2.674858703855446e-06, "1": 1.7696885275486169e-06}, "score": 4.996660969068481}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9907473793821263, "4": 0.009080077056556893, "3": 0.0001608222242917576, "2": 4.734603845402805e-06, "1": 0}, "score": 4.990584008896305}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9826865160862471, "4": 0.017014262773534742, "3": 0.0002840665546212997, "2": 9.447040878932185e-06, "1": 2.706968997805553e-06}, "score": 4.9823783822435965}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9524170779893599, "4": 0.044736202760599246, "3": 0.0025670333124142236, "2": 0.000234375272165689, "1": 3.575601683173577e-05}, "score": 4.9492830961485526}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8876491370531246, "1": 0.11053394617484154, "3": 0.0018097137416437771, "4": 5.179406932722374e-06, "5": 0}, "score": 1.8912859063842777}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6885801466245205, "5": 0.2610227788970764, "3": 0.04939460852077248, "2": 0.0009260666959943606, "1": 0}, "score": 4.209792064943174}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5318001330421338, "4": 0.4617328970518616, "3": 0.006373288465396624, "2": 8.559531565247605e-05, "1": 3.048475281638361e-06}, "score": 4.525249154540819}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.4672506694045402, "4": 0.4306838864887664, "2": 0.0772786544956514, "5": 0.024525619841173425, "1": 0.0002598941825458523}, "score": 3.401937196016362}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5538060188669408, "3": 0.26131920794278574, "5": 0.10320162292921942, "2": 0.08091045739866173, "1": 0.0007590856052788162}, "score": 3.6777830810540006}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9210679011343083, "1": 0.07802727764738661, "3": 0.0008991639237630183, "4": 2.6646202654799924e-06, "5": 0}, "score": 1.9228769847128435}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6782371862443225, "3": 0.2919316148094604, "4": 0.0235228544651839, "1": 0.004502114966780097, "5": 0.001799013895554384}, "score": 2.3398747028659725}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.599522142650395, "5": 0.3817953526405136, "3": 0.018146174714787956, "2": 0.0005155652429768015, "1": 9.65803834728995e-06}, "score": 4.362593100542226}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5307258399600541, "5": 0.3330014615407712, "3": 0.1210242911775765, "2": 0.014947975595300757, "1": 0.00029056536452844026}, "score": 4.181211310975359}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8772942711161792, "3": 0.06089925119442038, "5": 0.059796927436865814, "2": 0.001997554093679313, "1": 1.1733013768950943e-05}, "score": 3.9948673676631525}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5177574964045301, "1": 0.4397789784412875, "3": 0.04194797160163218, "4": 0.0003216482502632609, "5": 0.00016483806338759066}, "score": 1.603295272739954}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5561821113284566, "3": 0.3674744450595491, "1": 0.06674895081183943, "4": 0.008557809680647392, "5": 0.0010348094246416218}, "score": 2.320946143238071}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8465924491196462, "4": 0.1489421654096651, "3": 0.0044164962538339285, "2": 3.6162712913204596e-05, "1": 7.445833081268337e-06}, "score": 4.842085736718354}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978145386058962, "4": 0.0021611156197423004, "3": 2.3113839668238494e-05, "2": 5.745699436906662e-07, "1": 3.68027195754967e-07}, "score": 4.997789460242715}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.45915400606569073, "4": 0.4051301117052109, "3": 0.11756475392055529, "2": 0.00978936584822446, "1": 0.008285419464456673}, "score": 4.297176949433936}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.28306990435108825, "1": 0.2589799068556437, "5": 0.2292964663120499, "4": 0.11488633852747211, "3": 0.11337755896462609}, "score": 2.7723608136458524}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.9886352077467573, "2": 0.010789297590757259, "5": 0.00028523361834101096, "3": 0.00025900427256780737, "4": 2.7883289255382335e-05}, "score": 1.0125319327532767}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.42792007563877893, "4": 0.27625119510157076, "3": 0.18019640212810153, "2": 0.10033860126272713, "1": 0.015288337441135186}, "score": 4.001181465028057}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.8633758215647298, "2": 0.1324461673847765, "3": 0.00286987587291876, "5": 0.0011345592834218733, "4": 0.00017332172646516219}, "score": 1.1432441578517332}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9830719580714034, "1": 0.013509042539834938, "4": 0.0022218613243407356, "3": 0.0007771669234301478, "2": 0.00041589310078171324}, "score": 4.940939714516895}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8723852606252418, "1": 0.10853690777709857, "3": 0.018815219288912593, "4": 0.00020859603984953084, "5": 5.3832563735868474e-05}, "score": 1.9108569849066883}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5879921156099646, "3": 0.37925339838098915, "4": 0.030241721541766353, "1": 0.0016234402017863974, "5": 0.000862023521974025}, "score": 2.4407115035803835}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6057366247548608, "2": 0.3597163049520519, "4": 0.03340609535470291, "1": 0.0008362047990005322, "5": 0.0002991941093676822}, "score": 2.6726139435089076}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.6770266784349392, "3": 0.29767946267134643, "4": 0.01545444677341885, "1": 0.009181483372364829, "5": 0.0006276840645569032}, "score": 2.32129964264545}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6618769873663759, "3": 0.2609845940578129, "1": 0.04523068729734249, "4": 0.02762740677119548, "5": 0.003055852727812271}, "score": 2.280519767024601}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8073550376007826, "2": 0.11201080938253463, "4": 0.06740864535012425, "5": 0.007751969026121622, "1": 0.005465250616183871}, "score": 2.959970941025654}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.42196328968409597, "2": 0.4212917889418231, "1": 0.15074748903466964, "4": 0.004741171603895269, "5": 0.0012541189309507707}, "score": 2.284461109910173}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.9357450744098667, "4": 0.03224896916910142, "2": 0.02885484968947972, "5": 0.0029768181017730015, "1": 0.00017328515943883493}, "score": 3.009001194396722}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5552514526511703, "2": 0.371077775826273, "1": 0.06380634769043914, "4": 0.00932066780457673, "5": 0.0005397011486661461}, "score": 2.511707618928297}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.693706478210743, "2": 0.2576099138628644, "1": 0.025721059161446902, "4": 0.02112740217030194, "5": 0.0018341271100458213}, "score": 2.715743334409343}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7525727569923296, "2": 0.24573039483596795, "3": 0.001674303033000172, "4": 1.0236098672104252e-05, "5": 0}, "score": 1.2491127755371108}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8733410194822134, "4": 0.1252671653130316, "3": 0.0013161640444635167, "2": 6.488779568074267e-05, "1": 6.702359026702846e-06}, "score": 4.8718785134728195}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8262857094923067, "4": 0.16860718814689135, "3": 0.004656021271231358, "2": 0.0003722076725191087, "1": 0}, "score": 4.82095002400966}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.537471507332141, "4": 0.44076315997956983, "3": 0.019654206349252773, "2": 0.001915384295463718, "1": 0.00010663326931890055}, "score": 4.513712408867077}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.872504864118655, "4": 0.12173489383434498, "3": 0.0048558554158448005, "2": 0.000824170361525804, "1": 5.25002303897571e-05}, "score": 4.865867165696931}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"3": 0.484821837933098, "4": 0.4328203903158066, "2": 0.057695246031361586, "5": 0.02413233588125366, "1": 0.0005284058046729125}, "score": 3.4223337578953084}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8282025739424888, "3": 0.16443081084842373, "1": 0.005159939625714721, "4": 0.002058397935419125, "5": 0.00014809257100019944}, "score": 2.163831975128071}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9116921962381286, "4": 0.08372523947911643, "3": 0.004469440705487162, "2": 9.338498367618243e-05, "1": 1.6707371980294e-05}, "score": 4.906988612732832}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6518489276250748, "3": 0.2674952954241959, "5": 0.0674306578661788, "2": 0.012743792355726865, "1": 0.00047723978474413183}, "score": 3.773015130701829}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8559865633368371, "5": 0.09353984347818944, "3": 0.048780057862595344, "2": 0.0016596575385088388, "1": 3.33111627311147e-05}, "score": 4.041340560474819}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8767016573043729, "4": 0.07281526221075263, "1": 0.028020040294842164, "3": 0.015371209996029884, "2": 0.006870758989700995}, "score": 4.7636976400014115}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9979137786910524, "4": 0.0020634684467915193, "3": 1.6602471303127223e-05, "2": 9.994766949361563e-07, "1": 0}, "score": 4.997900317365232}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9802743034529787, "4": 0.019360811145500763, "3": 0.00035118092902442134, "2": 6.332319241814329e-06, "1": 0}, "score": 4.979917681988799}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9740385870791066, "4": 0.025419774099077235, "3": 0.0004785140427796566, "2": 1.3412117078691238e-05, "1": 0}, "score": 4.9735816481375315}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6965506553353773, "4": 0.2971221040264042, "3": 0.006052099756277219, "2": 0.00022225593050261352, "1": 3.2886642028866286e-05}, "score": 4.689969182009194}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9939676481381015, "2": 0.005907203739824668, "3": 0.0001099100779134093, "5": 3.645048086993009e-06, "4": 0}, "score": 1.006141675288417}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.3872795636715042, "3": 0.3235712312318481, "5": 0.23866430404294564, "2": 0.05024966996124218, "1": 0.00021460552124996762}, "score": 3.813946078856464}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8045931363619804, "4": 0.18564309364382195, "3": 0.009634686647106405, "2": 0.0001133692916590573, "1": 1.009540689928391e-05}, "score": 4.794705890083942}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5687060707168795, "5": 0.24113252508764424, "3": 0.18611397948867517, "2": 0.003994303731238445, "1": 5.044302885493516e-05}, "score": 4.04687873458868}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5816085802701516, "3": 0.24742254387354792, "5": 0.11582312917257855, "2": 0.05296431998321763, "1": 0.002079966273632766}, "score": 3.7562073112014236}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9507689316876948, "4": 0.04860739009828936, "3": 0.0006180369578181055, "2": 4.603107219522303e-06, "1": 7.856259880041137e-07}, "score": 4.95013957156956}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4732289829101721, "4": 0.34210197973794193, "3": 0.16828405900627394, "2": 0.015464766060318966, "1": 0.0007912196043241201}, "score": 4.271676777286146}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8310699433325969, "4": 0.16626408187928163, "3": 0.0026331579807054033, "2": 2.6555199271855292e-05, "1": 3.4104237756708267e-06}, "score": 4.828375805534168}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.924119885079196, "4": 0.07294786288907787, "3": 0.002829169707358835, "2": 7.62950116441877e-05, "1": 0}, "score": 4.921162800824563}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.759391564012317, "4": 0.2277941975452513, "3": 0.012510906438673884, "2": 0.00027675054972997327, "1": 2.269415853165746e-05}, "score": 4.746261974939403}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8300611551518123, "2": 0.16982465761697293, "3": 0.00011261017299784663, "4": 2.50023980921137e-07, "5": 0}, "score": 1.1700508536982162}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.798459326505601, "4": 0.18763796327677934, "3": 0.012388887221569821, "2": 0.0013088387307342076, "1": 0.00019884717362794445}, "score": 4.782861024791568}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8668914169588184, "4": 0.12770293916982703, "3": 0.005156367088842282, "2": 0.00018992163846645344, "1": 0}, "score": 4.8614063354901695}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8130598466727202, "4": 0.17943151067374366, "3": 0.006336591965093581, "2": 0.0008687809811202374, "1": 0.0001618073706982718}, "score": 4.804614093222998}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.951085533397573, "4": 0.0324643180156123, "3": 0.008056583465374766, "1": 0.006766722029070095, "2": 0.0016217718384235085}, "score": 4.919489903134941}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"2": 0.659546830663563, "3": 0.3307818117374622, "4": 0.008014921396644208, "1": 0.001405307695243719, "5": 0.00025018773047570393}, "score": 2.346157235683565}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.799332815415689, "4": 0.19100012432872232, "3": 0.009506813755941352, "2": 0.00015302748686424038, "1": 5.769916205461868e-06}, "score": 4.78950378100463}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9470357932952814, "4": 0.0524182062752639, "3": 0.0005187222405728057, "2": 1.7125944877664754e-05, "1": 0}, "score": 4.946492428187033}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986373590394361, "4": 0.0013578088747411396, "3": 4.734331613508442e-06, "2": 3.9127785333008574e-08, "1": 0}, "score": 4.998632604998511}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.878543162955673, "4": 0.11825062100452431, "3": 0.0031153483597811814, "2": 6.311109322412098e-05, "1": 0}, "score": 4.875325888468443}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7894651800965111, "4": 0.20819750636215756, "3": 0.0022778674560505223, "2": 5.120358545257898e-05, "1": 0}, "score": 4.787091393070227}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9741587100019965, "4": 0.02527091119152559, "3": 0.0005406933286554706, "2": 2.2188553725562572e-05, "1": 5.996143772156304e-06}, "score": 4.9735571122299325}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9986935900973654, "4": 0.0013021099392661857, "3": 2.6141619233954466e-06, "1": 0, "2": 0}, "score": 4.99869265953297}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993646087465704, "4": 0.0006341128642809706, "3": 9.93555413962677e-07, "1": 0, "2": 0}, "score": 4.999363899843709}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6999056491163193, "4": 0.29380799594701074, "3": 0.006096244214295794, "2": 0.00017645970640085823, "1": 1.1055118771742556e-05}, "score": 4.693425120193236}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9993477037377674, "4": 0.0006497130851403066, "3": 2.450464400857062e-06, "2": 4.660388174663449e-08, "1": 0}, "score": 4.9993452461180325}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.961368051788163, "4": 0.037821365922399555, "3": 0.0007951558697095115, "2": 1.3454095501685965e-05, "1": 1.4807127474481673e-06}, "score": 4.96054201780269}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9970904754944127, "4": 0.0028536588530238367, "3": 4.647253802219372e-05, "2": 2.774200390100325e-06, "1": 0}, "score": 4.9970450539112266}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994774860579808, "4": 0.0004993661318997076, "3": 1.3973093086563178e-05, "1": 5.7221153757737995e-06, "2": 0}, "score": 4.999449797320793}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9991311947300391, "4": 0.0008587658994119837, "3": 7.900432919942832e-06, "1": 2.2259341071569376e-07, "2": 0}, "score": 4.999124541183424}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7160113000165562, "4": 0.2697227768129154, "3": 0.012874297461734421, "2": 0.0010496832783308601, "1": 0.0002710430211643559}, "score": 4.700274155958673}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6857519812473661, "4": 0.2993303996858913, "3": 0.01347602632455392, "2": 0.0012082086148104013, "1": 0.0001783725887728847}, "score": 4.669361242518707}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918986195044851, "4": 0.008051144691169394, "3": 4.77507397027717e-05, "2": 1.132046501458567e-06, "1": 0}, "score": 4.991849946662751}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8793108177402439, "4": 0.11694830259439859, "3": 0.00361450847790616, "2": 8.828953268675032e-05, "1": 2.1855345959717034e-05}, "score": 4.8754683697792025}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7869823010134663, "4": 0.20027332908880388, "3": 0.011959566224163906, "2": 0.0006331125167729564, "1": 0}, "score": 4.773873899582796}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4166837659149765, "4": 0.3818231865362543, "2": 0.13561067261130447, "5": 0.06336927224071105, "1": 0.0024841607570403198}, "score": 3.367993387334723}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8979962828982769, "3": 0.05755631610308012, "1": 0.042979286012189345, "4": 0.0013084928503677778, "5": 0.00015921174693436126}, "score": 2.0176716582846863}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9639311038123048, "4": 0.034343070940734924, "3": 0.0016697895140301892, "2": 4.214409408251408e-05, "1": 0}, "score": 4.962190392511546}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7063744780117635, "4": 0.2696228360719917, "3": 0.02088169377010053, "2": 0.0029722144438565244, "1": 0.00014636486183989918}, "score": 4.679110899354676}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.9043842803788498, "3": 0.06997914569235548, "1": 0.02343654553314255, "4": 0.0019714085336825786, "5": 0.00021799531199859787}, "score": 2.051139946501491}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5817864051922947, "3": 0.2717976563507568, "5": 0.13503989846811973, "2": 0.011329129934074622, "1": 4.360948000223981e-05}, "score": 3.840452627211177}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6469246188509821, "2": 0.3033080873862513, "4": 0.040602038673585576, "5": 0.007243092665861263, "1": 0.0019217885309645657}, "score": 2.747936465312499}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6891260075513029, "4": 0.28946392532787474, "3": 0.02083935526407431, "2": 0.0005553477854636237, "1": 1.2067858040937851e-05}, "score": 4.667141952184316}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998909793831794, "4": 0.00010800910811476793, "3": 9.234658655839757e-07, "2": 1.908242657556488e-08, "1": 0}, "score": 4.999890086705295}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9685272763804237, "4": 0.026493104166107093, "3": 0.004660451253583037, "2": 0.0002530427781330299, "1": 0}, "score": 4.963424446418421}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5433007744337696, "2": 0.31821710787144475, "4": 0.13274778559714623, "5": 0.004285881630589775, "1": 0.0014386688538075992}, "score": 2.8202233447735545}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5147455129820206, "4": 0.4447789330120679, "5": 0.020587584068782763, "2": 0.01981875831748751, "1": 5.565119538834594e-05}, "score": 3.466030360010766}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6062760552027114, "4": 0.3888464279785513, "3": 0.004828720274228189, "2": 3.599015964743541e-05, "1": 0}, "score": 4.601383056152055}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8690764785950024, "4": 0.12452858388390982, "3": 0.00587979724387685, "1": 0.0002693340842656874, "2": 0.00022883439087171756}, "score": 4.86194563908737}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5409731941875073, "5": 0.3832030398937549, "3": 0.06725136253244043, "2": 0.008016967867297636, "1": 0.00035259657556560673}, "score": 4.29892058463558}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6038093660427764, "3": 0.2874349514990162, "5": 0.09198843650461465, "2": 0.01658495367124577, "1": 0.00018064243099052393}, "score": 3.770841272292298}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9844828116690078, "4": 0.015153435606947506, "3": 0.00033815415045940645, "2": 8.14011703735296e-06, "1": 0}, "score": 4.984145558946952}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.52322658909225, "5": 0.43319296655921474, "3": 0.04218443351681698, "2": 0.001305476722914173, "1": 6.223027128500463e-05}, "score": 4.388221876951641}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5904232655812394, "4": 0.40207729207544934, "3": 0.007312444910934196, "2": 0.0001615528862286103, "1": 1.6290165105693428e-05}, "score": 4.582744179064797}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982564867881394, "4": 0.0017257378169049787, "3": 1.2889893542099485e-05, "1": 1.2588738581733264e-06, "2": 0}, "score": 4.998243440530191}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5291429482990354, "3": 0.3622488399981496, "4": 0.09961226294825903, "5": 0.004807845097145662, "1": 0.004164257044280644}, "score": 2.571746278354132}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.3271336421455281, "3": 0.2845077457362213, "4": 0.2728303787932537, "5": 0.10060367411153101, "1": 0.014867457722592172}, "score": 3.1171758603419235}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.506001502667735, "5": 0.4772439945033652, "3": 0.016093223439109156, "2": 0.00062119122044971, "1": 2.9831520158756995e-05}, "score": 4.459823610312337}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7152171329090595, "4": 0.2701131320906081, "3": 0.01434889992491107, "2": 0.00031393393257705016, "1": 5.551541061555635e-06}, "score": 4.700224655520253}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6466118740714997, "4": 0.33528958088537286, "3": 0.01678343316904819, "2": 0.0012158877628328853, "1": 6.132444610404585e-05}, "score": 4.627236464090427}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4846230871845596, "3": 0.2631048386997266, "4": 0.24081860626263335, "5": 0.007740850606021358, "1": 0.003628271191268913}, "score": 2.764400806044821}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9417012491339732, "4": 0.05744042242922348, "3": 0.0006744584401528784, "2": 8.143112394412917e-05, "1": 0}, "score": 4.940960319360309}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8311632361696986, "4": 0.1656294027422905, "3": 0.0030753105221778894, "2": 2.968876103806132e-05, "1": 0}, "score": 4.828113315298973}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9927859864208624, "4": 0.007163676157149973, "3": 3.969054737528397e-05, "2": 1.234208110028212e-06, "1": 0}, "score": 4.992753171911794}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9931468337864086, "4": 0.006773400694061648, "3": 6.437147228102372e-05, "2": 1.9536854398096494e-06, "1": 0}, "score": 4.993091902457727}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9741839390909582, "1": 0.020337201171857534, "3": 0.005449174225739304, "4": 2.529542521809837e-05, "5": 0}, "score": 1.9851624987664078}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9323974320066032, "4": 0.0667072524224958, "3": 0.0008337927397327654, "2": 4.728814160139503e-05, "1": 7.636684614129597e-06}, "score": 4.931452298656705}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8092004965969244, "4": 0.18982294684166365, "3": 0.00091481692012863, "2": 1.571859738211978e-05, "1": 0}, "score": 4.808291440897917}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9653846509916149, "4": 0.03379218892816487, "3": 0.0007703974557430691, "2": 3.983426844219855e-05, "1": 9.392312710704993e-06}, "score": 4.964509818609361}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8290777836179541, "4": 0.15775853096588333, "3": 0.011161599588468728, "2": 0.0015285831780872444, "1": 0.0004345041769810378}, "score": 4.813587233801833}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"4": 0.35417862596188093, "2": 0.29026116276645025, "3": 0.18990061929603383, "5": 0.11423821562978777, "1": 0.05138700291868812}, "score": 3.189626406727109}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4967795066093687, "5": 0.4650666129493916, "3": 0.030590566557109688, "2": 0.006786642071613551, "1": 0.0007679804353083586}, "score": 4.418602459175003}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7960910462241741, "4": 0.19902142435046188, "3": 0.004449770754382845, "2": 0.0003682035307475905, "1": 4.925710188654861e-05}, "score": 4.790773148246324}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9915131275690015, "4": 0.008381825065120632, "3": 6.630282846954582e-05, "2": 5.7631232460104945e-06, "1": 0}, "score": 4.991467998510728}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.923005846742898, "4": 0.07610936194992739, "3": 0.000805181693340852, "2": 6.961914197923521e-05, "1": 7.7812777347533e-06}, "score": 4.922040119898005}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9865580399877568, "2": 0.01337431369553449, "3": 6.542173599860407e-05, "5": 7.905602228185547e-07, "4": 0}, "score": 1.0135083387796575}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4890568493133409, "3": 0.2140438881872901, "5": 0.2140275572616541, "2": 0.0775109083208846, "1": 0.00535306813112056}, "score": 3.8289013256542437}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.505485335921374, "5": 0.37735318494225367, "3": 0.10541727045379361, "2": 0.011304334983176748, "1": 0.00037545009439504304}, "score": 4.248216885265493}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9059888861110444, "4": 0.09229873895740294, "3": 0.0016213383967431593, "2": 7.090181679509406e-05, "1": 1.3232958291943834e-05}, "score": 4.904192285723735}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8377888828608577, "4": 0.15388435503459263, "3": 0.008021402476584708, "2": 0.00026612990599323165, "1": 3.743636499039781e-05}, "score": 4.829124398393344}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4554977508750603, "3": 0.3998587017120485, "4": 0.13526495423647694, "5": 0.00622516083510796, "1": 0.003135185299328883}, "score": 2.685941423792952}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9603221767887501, "4": 0.039089460529562206, "3": 0.0005515552736974988, "2": 1.870293676832017e-05, "1": 0}, "score": 4.959750591418478}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9750722969649867, "4": 0.024611528687269825, "3": 0.00028987667037720167, "2": 1.0362210242674587e-05, "1": 0}, "score": 4.974777229404617}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.821599039030737, "4": 0.1738326020544423, "3": 0.004324178927385087, "2": 0.00021751407432258076, "1": 1.8696672333854147e-05}, "score": 4.816790251135882}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9948157789989902, "4": 0.005118340569420388, "3": 5.705362174344155e-05, "2": 2.4316293765117434e-06, "1": 0}, "score": 4.9947602237896485}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.641210424872554, "4": 0.3280002199562156, "3": 0.027461152757713315, "2": 0.0031686298769441827, "1": 0.00014658867830102}, "score": 4.606980127269995}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9954088487050484, "4": 0.00451074026660529, "3": 6.671398212165827e-05, "1": 6.168967969011305e-06, "2": 0}, "score": 4.9953311207495865}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9978271211265606, "4": 0.002155490437742716, "3": 8.656292888160483e-06, "2": 2.9709229168536757e-07, "1": 0}, "score": 4.99782628736423}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982040988637997, "4": 0.0017663235198592136, "3": 1.7383744718010783e-05, "1": 2.4404063393589617e-06, "2": 0}, "score": 4.998189129703087}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9851867065257515, "4": 0.014608865624578186, "3": 0.0001880574606646556, "2": 6.829213805578654e-06, "1": 5.440641942077443e-06}, "score": 4.984972707624995}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.828035972907623, "4": 0.16595818831044795, "3": 0.005541832814465958, "2": 0.0004515628464494595, "1": 1.0884171283326745e-05}, "score": 4.821559642656591}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9951468074812315, "4": 0.004721465690217183, "3": 0.0001096969493603532, "2": 1.3678339974859385e-05, "1": 7.162438946561681e-06}, "score": 4.994989449677305}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9929585003556104, "4": 0.006987675671458402, "3": 5.124938192594703e-05, "2": 9.330220527410499e-07, "1": 0}, "score": 4.992907014854908}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975385553351738, "4": 0.002443331016447719, "3": 1.6197235150725007e-05, "2": 6.406811049473549e-07, "1": 0}, "score": 4.997522349309118}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9567783342611272, "4": 0.04232933222620633, "3": 0.0008621084354728606, "2": 2.5557263397817005e-05, "1": 4.428888093973576e-06}, "score": 4.955852053012201}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4219208380930839, "4": 0.27132310470654675, "3": 0.2534934993169052, "5": 0.04025081608175502, "1": 0.01297870034789605}, "score": 2.9039433242289645}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.614056736733907, "3": 0.31106894601694207, "5": 0.042556758496306545, "2": 0.03143473774351347, "1": 0.0008303942250470014}, "score": 3.6661096495198167}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.46754269884328076, "2": 0.41048717211223923, "4": 0.11595979996090254, "5": 0.003009332456699487, "1": 0.0029907927288910655}, "score": 2.7055067023247132}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7911527340744584, "4": 0.20156170826245165, "3": 0.0071406069445783754, "2": 0.0001166890328943544, "1": 0}, "score": 4.783800900598731}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6162183955819973, "4": 0.3624931867632139, "3": 0.019122234710966128, "2": 0.0019385306301960943, "1": 0.00018033650141855256}, "score": 4.592706134478537}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3939982544594427, "3": 0.3797132562207388, "2": 0.20729482990719808, "5": 0.016251705855384282, "1": 0.0027306426351392647}, "score": 3.213747968679357}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9878324881655768, "4": 0.012080327209055103, "3": 8.473667933884329e-05, "2": 1.6367303421371116e-06, "1": 0}, "score": 4.98774527930002}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9915545022920248, "4": 0.008421932196792437, "3": 2.159270568664279e-05, "2": 5.211312018128757e-07, "1": 0}, "score": 4.991533306707348}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9711641747213797, "4": 0.028416636871427092, "3": 0.0004158753425254514, "2": 2.5731132779556837e-06, "1": 4.6601127865096383e-07}, "score": 4.970742021043638}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4593968709119043, "3": 0.34884733081823716, "2": 0.14969035776775938, "5": 0.038985511573125554, "1": 0.0030685044067837865}, "score": 3.38154488644485}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5565281085601794, "4": 0.3933637471173956, "3": 0.04803356219564902, "2": 0.0019154293075235515, "1": 8.223726608005333e-05}, "score": 4.504455776446339}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8723847110227008, "4": 0.1210698411880436, "3": 0.006046089376410573, "2": 0.0004539429629881508, "1": 2.9766826179216964e-05}, "score": 4.865354976856157}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9816510961476951, "4": 0.017963969887989623, "3": 0.00030115002363261006, "2": 1.0247118641955988e-05, "1": 0}, "score": 4.981401621043136}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.5536798208560506, "4": 0.2870306426805886, "2": 0.07936344556899393, "5": 0.07847579858560536, "1": 0.001345979336043042}, "score": 3.361964593213456}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8193228848715045, "4": 0.1480113528076715, "3": 0.02783072925141032, "2": 0.004581870308100196, "1": 0.00024039431588209427}, "score": 4.781617212092969}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.821682230144918, "4": 0.15176387802676028, "3": 0.025292195730127056, "2": 0.0010699418262253588, "1": 0.0001910103390940946}, "score": 4.793677710187998}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9886073602624313, "4": 0.010959983532198826, "3": 0.00039950531049209425, "2": 1.5671872701907914e-05, "1": 1.1527028222111963e-05}, "score": 4.988147811571669}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.994240614219246, "4": 0.0056351021718746485, "3": 0.00011433863846207347, "2": 1.7009697982486082e-06, "1": 0}, "score": 4.994131069258338}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9855871835408917, "4": 0.013407587512475309, "3": 0.0009784287395438293, "2": 1.8369121177025272e-05, "1": 6.740786152534779e-06}, "score": 4.984553458391011}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982693200567205, "4": 0.001653056963598274, "3": 7.035821555898683e-05, "1": 4.750959311467572e-06, "2": 1.597643223404761e-06}, "score": 4.998182428173178}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5187408480012952, "3": 0.3365148500381227, "2": 0.10569739834341699, "5": 0.03828514948089858, "1": 0.0007373749820383083}, "score": 3.4881508993616612}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5019673506255655, "4": 0.4695657723233252, "3": 0.02548638986721851, "2": 0.0027099583858048435, "1": 0.0002164629839427228}, "score": 4.470437089599162}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.568442474003192, "4": 0.4125796627643732, "3": 0.018470851205333805, "2": 0.00046558773697779997, "1": 0}, "score": 4.54906319187686}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.635979938104743, "4": 0.3600926210242675, "3": 0.0036822341685485787, "2": 0.00022490015720493108, "1": 1.1676713483456291e-05}, "score": 4.631818325967185}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7968230618864565, "4": 0.2002822214220238, "3": 0.00278443471798053, "2": 9.347813493309305e-05, "1": 1.2912147797236307e-05}, "score": 4.793816023741742}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9665184181220612, "4": 0.033033542313243555, "3": 0.0004344650733647986, "2": 9.291881463233472e-06, "1": 0}, "score": 4.966069506584571}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8683610713498686, "4": 0.12639491847699585, "3": 0.004814052663624789, "2": 0.00032127262378533767, "1": 6.151041794612321e-05}, "score": 4.862760642458963}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993480610745897, "4": 0.0006492348774694765, "3": 2.0489973131634525e-06, "1": 7.776254098903452e-08, "2": 0}, "score": 4.999346355700399}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996990219729768, "4": 0.0002991073556558619, "3": 1.6568091569352965e-06, "1": 3.971396293023779e-08, "2": 0}, "score": 4.999697420117485}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9983863416489323, "4": 0.0016016860873579054, "3": 1.0292475126169501e-05, "2": 4.0560502325302954e-07, "1": 0}, "score": 4.998376510078696}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6492544528569718, "3": 0.21148599503856855, "1": 0.07423276124796047, "4": 0.0464924102565479, "5": 0.01833797559863774}, "score": 2.285308017021075}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7140902671882998, "4": 0.26607828739157474, "3": 0.018333505345132832, "2": 0.001232944090635934, "1": 0}, "score": 4.693474641657187}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.676688317378782, "5": 0.241857976275151, "3": 0.07566500581433698, "2": 0.005534522421071973, "1": 0}, "score": 4.155163364749566}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5865148450240375, "5": 0.31291293189457914, "3": 0.07877600764415842, "2": 0.018266527360049863, "1": 0.0025246261162271432}, "score": 4.190221175249049}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4874831272073123, "3": 0.2502990439920912, "2": 0.19142434762144786, "5": 0.06715219288707086, "1": 0.0036076863946585803}, "score": 3.4231620116171952}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5547732262984497, "5": 0.3795461052750059, "3": 0.06190876561673711, "2": 0.003606692974625707, "1": 0.00014269072957894433}, "score": 4.310002862507478}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9926813088127667, "4": 0.0072928635855652605, "3": 2.4995018823710118e-05, "2": 2.904556326085259e-07, "1": 0}, "score": 4.992656271028654}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9947117323803933, "4": 0.005270086515290258, "3": 1.7409178340236115e-05, "2": 1.8392146336373568e-07, "1": 0}, "score": 4.994694540244004}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962328011651292, "4": 0.0037565548684221845, "3": 1.0291327579169875e-05, "2": 1.268762036879117e-07, "1": 0}, "score": 4.9962224809949864}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.478416111035069, "5": 0.4248341378979387, "3": 0.09319275466112291, "2": 0.0034312539552262275, "1": 0.00012505636528710998}, "score": 4.324403928799287}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5977694108379323, "4": 0.39213518458756536, "3": 0.00961268786998135, "2": 0.00042571489343043515, "1": 4.4919345434753015e-05}, "score": 4.587177629698331}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9757536141080116, "4": 0.02401410290918239, "3": 0.0002142217209706581, "2": 5.017393410746597e-06, "1": 0}, "score": 4.975542082442786}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9513139735292668, "4": 0.04803436436283577, "3": 0.0006094650212154191, "2": 1.3948284948706948e-05, "1": 0}, "score": 4.950703468171934}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9685838555223482, "4": 0.029700119785494, "3": 0.0009141083030863543, "2": 6.92753094670264e-05, "1": 0}, "score": 4.968240569416422}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6414209046718429, "5": 0.27265405095747836, "3": 0.07597121959167781, "2": 0.009136212195825888, "1": 0.0007794336435736112}, "score": 4.176078828546388}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6271461822431782, "5": 0.3306145776639659, "3": 0.040784955635308096, "2": 0.0013707887155712524, "1": 0}, "score": 4.2871120172284245}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8469351937069601, "4": 0.1491022450471284, "3": 0.0039261891715174115, "2": 3.32275568739297e-05, "1": 1.9352926550474627e-06}, "score": 4.842937762845032}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9979486753481265, "4": 0.002031662206588291, "3": 1.9139228136485375e-05, "2": 1.889347725947833e-07, "1": 0}, "score": 4.997929491840687}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9831615917770614, "4": 0.01660604322783727, "3": 0.00022611790300838613, "2": 5.06973505055434e-06, "1": 9.65904373374406e-07}, "score": 4.982922644532448}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998072065270506, "4": 0.00019150033499958744, "3": 1.0318420035095187e-06, "1": 4.9078489198703214e-08, "2": 0}, "score": 4.999806239625919}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8690717073782319, "3": 0.123642987390931, "1": 0.004797962165830284, "4": 0.0023520593862701375, "5": 9.493472573972177e-05}, "score": 2.123838944946629}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.44866051882936797, "3": 0.3754580994585501, "4": 0.16433237915227863, "5": 0.006242574509740748, "1": 0.004651997415003963}, "score": 2.718668902823798}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9387961697087599, "4": 0.0604642498604385, "3": 0.0006232987622205932, "2": 2.714173439796844e-05, "1": 0}, "score": 4.938202218761775}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7845436090637327, "4": 0.20354743610709491, "3": 0.010158145327513694, "2": 0.001473216018770192, "1": 0.00022128745505936288}, "score": 4.770818571065414}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6771689028253383, "5": 0.29968654516848986, "3": 0.021441816962179373, "2": 0.0015719721522275553, "1": 6.689120930413474e-05}, "score": 4.274917669728047}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6781591663262087, "1": 0.20540371397114626, "3": 0.07857016749526509, "4": 0.03580871426402234, "5": 0.0020432152682490815}, "score": 1.9509127904357093}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.993755695707958, "4": 0.006230488738888288, "3": 1.0063726846681275e-05, "1": 4.4691831478730765e-07, "2": 0}, "score": 4.993747575470472}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8707170250920332, "4": 0.1283587758032059, "3": 0.0008791128359269966, "2": 1.5037206420692856e-05, "1": 0}, "score": 4.869833975538685}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997369107140573, "4": 0.00026190125881243935, "3": 8.439639977116752e-07, "1": 8.550833332189645e-08, "2": 0}, "score": 4.999736068711618}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8295199159962677, "4": 0.1683713705899821, "3": 0.001845703635388483, "2": 0.0001683197691349591, "1": 8.263981266796726e-05}, "score": 4.8270996200976}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5970014361386797, "2": 0.21733679020475302, "4": 0.1684803421152409, "5": 0.015487825736941687, "1": 0.001689416121465101}, "score": 2.9787402820699636}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9698062283770967, "4": 0.029671538271513243, "3": 0.00047037326387291403, "2": 3.070933125132104e-05, "1": 0}, "score": 4.9692949377717}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9960682705676361, "4": 0.003892331280348617, "3": 3.344029326165143e-05, "2": 4.956796429707007e-07, "1": 0}, "score": 4.996039279460034}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8130939796415295, "4": 0.18212509369728425, "3": 0.0046235600362902985, "2": 0.00012976544582968223, "1": 0}, "score": 4.8082331969027745}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9673851346523279, "4": 0.03227385884877476, "3": 0.0003292507300602952, "2": 6.92078746007713e-06, "1": 0}, "score": 4.96704671800022}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6998848552283787, "4": 0.2880771075880487, "3": 0.011151993587200025, "2": 0.0007181637147035833, "1": 0}, "score": 4.687411936846388}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9829949973635056, "4": 0.016714945828612684, "3": 0.00027629097233092953, "2": 3.718608569897107e-06, "1": 0}, "score": 4.982721142796416}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9604378449571198, "4": 0.03926605004476799, "3": 0.00028739959313366927, "2": 2.052844839974687e-06, "1": 0}, "score": 4.960152727148065}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9897741828531177, "4": 0.010151622845689106, "3": 6.454660738451081e-05, "2": 2.620079230499089e-06, "1": 0}, "score": 4.989711351397193}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9894133274942921, "4": 0.010511950774940895, "3": 6.020747764447301e-05, "2": 1.558148968304843e-06, "1": 0}, "score": 4.989362822006479}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9518534834255125, "3": 0.027568942819572593, "1": 0.020107642747390193, "4": 0.000425785567968569, "5": 4.33865965417912e-05}, "score": 2.008443037404685}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.4134744152798963, "4": 0.39363578529993387, "2": 0.16936685111563035, "5": 0.022474629134644486, "1": 0.0010095866392210349}, "score": 3.2672093688702266}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5463956128220572, "5": 0.4436618525789799, "3": 0.009823684729098822, "2": 0.00010368013741344787, "1": 0}, "score": 4.433637385738177}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8776196321501168, "4": 0.12124792047903382, "3": 0.0011125795954625673, "2": 1.6012450213074404e-05, "1": 2.216480456676585e-06}, "score": 4.876469814610783}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7962214805045094, "3": 0.10363885201594987, "5": 0.098971376194696, "2": 0.0011397215509079696, "1": 2.2646777270990846e-05}, "score": 3.9929850991961633}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8289124571216467, "2": 0.17013655494392743, "3": 0.0008521005684619726, "5": 4.789238706996078e-05, "4": 4.2350810454038766e-05}, "score": 1.1721608662480199}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4371283587059402, "5": 0.35873210309352976, "3": 0.14977985443801276, "2": 0.05361119879426279, "1": 0.0005467062062082437}, "score": 4.100109932506617}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9827583442513586, "4": 0.017166827347084856, "3": 6.828830745272919e-05, "2": 2.67607068934228e-06, "1": 0}, "score": 4.982688500933903}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9058322496446958, "4": 0.0928686639069583, "3": 0.0012319894219342486, "2": 5.57893816330274e-05, "1": 6.687342482755735e-06}, "score": 4.904472798369794}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9882557544041327, "4": 0.011580391489793274, "3": 0.00013500199525073343, "2": 1.3455952294980984e-05, "1": 0}, "score": 4.988109053587924}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7395479188092102, "5": 0.13104661229811476, "3": 0.11897341668825663, "2": 0.010336465460631604, "1": 8.759882266583258e-05}, "score": 3.9911373974268267}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.768941350204077, "4": 0.22176575762531978, "3": 0.00894192579217317, "2": 0.00032272306061301474, "1": 2.3038369335735046e-05}, "score": 4.7592888152418364}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.49866006890940484, "5": 0.4545862701797934, "3": 0.04624374811743608, "2": 0.00041220613750085465, "1": 0}, "score": 4.4075579309098565}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952333546841733, "4": 0.004733726230709296, "3": 2.7589066638778845e-05, "2": 9.7924301248909e-07, "1": 0}, "score": 4.995208137058656}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6667585317342545, "4": 0.31427933079629944, "3": 0.018542772286625077, "2": 0.0003862482733706923, "1": 2.789346851356212e-05}, "score": 4.647362963957554}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5466746736601331, "5": 0.3295340803128885, "3": 0.11223471846768043, "2": 0.010583304147837438, "1": 0.0009563730513040092}, "score": 4.193266891012341}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9355800796714588, "4": 0.0620033725158182, "3": 0.0022187056359616276, "2": 0.00014277679803591223, "1": 5.0871281895874016e-05}, "score": 4.9329271193804125}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9557159915847409, "4": 0.04347457910933671, "3": 0.0007729744213715151, "2": 1.606746721752877e-05, "1": 0}, "score": 4.9549303507925195}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9743160902597462, "4": 0.0246767370247615, "3": 0.0009451669305367279, "2": 4.5168392351419534e-05, "1": 1.4050985813275507e-05}, "score": 4.9732411454328025}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.967333927475563, "4": 0.031073198994457353, "3": 0.0014193243932348256, "2": 0.00010583185467204143, "1": 6.156604850517069e-05}, "score": 4.965524180392217}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.815519161964254, "3": 0.11745777167429368, "4": 0.04041956617473741, "1": 0.016017186131370677, "5": 0.010493817549938746}, "score": 2.2137809445325054}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6058189923633637, "4": 0.35693217544492345, "3": 0.018655894944890807, "2": 0.017271728585945594, "1": 0.001155010319980784}, "score": 4.549245893042806}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9954822052758793, "4": 0.004497241815558768, "3": 1.3384637016999247e-05, "2": 4.444416774222145e-07, "1": 0}, "score": 4.995474625157525}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948704052362588, "4": 0.005112074441010088, "3": 1.512479663133369e-05, "2": 9.033633351040347e-07, "1": 0}, "score": 4.994854958198482}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7869171179690665, "5": 0.1851570490950931, "3": 0.026402887495006577, "2": 0.0013518080314705227, "1": 0.00010181847367772063}, "score": 4.155755886948422}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"1": 0.4874830102113758, "2": 0.46273136428908296, "3": 0.046805432674835126, "4": 0.0018456648760191157, "5": 0.001091155557283946}, "score": 1.5662684069109303}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5079115808487789, "5": 0.4709615137913261, "3": 0.018676072871530655, "2": 0.002236682136997922, "1": 0}, "score": 4.4479079963005885}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.953557081976935, "4": 0.045882096154640825, "3": 0.0005155844223605747, "2": 7.359268637984954e-06, "1": 0}, "score": 4.953062879302139}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9890709399135718, "4": 0.010741763544315353, "3": 0.00016713127107251222, "2": 6.775848223463849e-06, "1": 0}, "score": 4.9889034977931095}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9926968193808551, "4": 0.007202475446759615, "3": 8.768962207208568e-05, "2": 5.95830805844864e-06, "1": 0}, "score": 4.992604218191097}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.908418621256022, "1": 0.04776647716789258, "3": 0.0415678103877489, "4": 0.0020228564141672417, "5": 0.00017952142460993988}, "score": 1.9983855381340228}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9840183507181156, "4": 0.015607089700268566, "3": 0.0002827495597495572, "1": 5.6167570779788125e-05, "2": 3.3590744172526365e-05}, "score": 4.9835019348154015}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9800030010757642, "4": 0.019847966905326253, "3": 0.0001300305025540542, "2": 2.1550836897754624e-06, "1": 0}, "score": 4.979885167975333}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9921006347718557, "4": 0.007858279418520566, "3": 3.890273505166705e-05, "2": 1.4432673811721581e-06, "1": 4.4210739909800994e-07}, "score": 4.992057814515249}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7264938436445969, "5": 0.22215292120289507, "3": 0.04602415093232625, "2": 0.00496474322421312, "1": 0.0003224791741798791}, "score": 4.165238763495274}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8436804414134724, "1": 0.15188456309332873, "3": 0.00434150724364065, "4": 7.63306497354722e-05, "5": 1.6285148507436658e-05}, "score": 1.8526583323468733}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6551932556963469, "3": 0.16990942126789588, "2": 0.10445737348806307, "5": 0.06870908822016887, "1": 0.0017286203053710788}, "score": 3.684698352462056}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7099197808843175, "4": 0.2884926990326871, "3": 0.0015520044344134983, "2": 2.8183214154379652e-05, "1": 0}, "score": 4.708316603706645}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8478500386865491, "4": 0.15101442755645816, "3": 0.001096294195417975, "2": 2.9584854496464526e-05, "1": 5.113492108343294e-06}, "score": 4.846683079275688}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6014700121033442, "3": 0.3515597838911045, "1": 0.038136265468656075, "4": 0.008078233957138817, "5": 0.0007548964276847852}, "score": 2.331844943800959}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5009495908627126, "4": 0.4866022425658466, "3": 0.011028013077237182, "2": 0.0013527063358846044, "1": 6.559120113827756e-05}, "score": 4.487020295399105}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.923202509471779, "4": 0.0760653378105149, "3": 0.0006101603905685998, "2": 7.511351915616535e-05, "1": 4.020540977000731e-05}, "score": 4.922327660873349}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8960826562347523, "5": 0.08953868611484057, "3": 0.0137204425688478, "2": 0.0006174914103026166, "1": 0}, "score": 4.074586298153273}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9703314362409742, "4": 0.02957931439381634, "3": 8.126354849078146e-05, "2": 4.449735062835279e-06, "1": 0}, "score": 4.970244704086857}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5891479137191391, "4": 0.40477296067150514, "3": 0.005216956985709122, "2": 0.0006235297995504451, "1": 0}, "score": 4.58282298132525}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7799283441444169, "3": 0.1984112266092837, "1": 0.01676365716158906, "4": 0.004454806737646548, "5": 0.0004003235751480748}, "score": 2.191766139130259}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6037261366583845, "2": 0.23280599773272592, "4": 0.098225855890961, "5": 0.043959158149738636, "1": 0.020845628854136742}, "score": 2.911608269877295}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6241442484125217, "5": 0.2829689796191459, "3": 0.09027031591595086, "2": 0.0025586589638245264, "1": 4.193926741904978e-05}, "score": 4.187458500656663}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7705566216733996, "4": 0.22454135037673117, "3": 0.004769837699131834, "2": 7.911112882318254e-05, "1": 0}, "score": 4.765669202765581}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8581860942043505, "4": 0.13624602774893918, "3": 0.005430666003387238, "2": 9.46036026169462e-05, "1": 0}, "score": 4.8526025490608875}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9445012033320875, "1": 0.04766490004834414, "3": 0.007690076096499162, "4": 0.0001182339818275421, "5": 2.4481250967799377e-05}, "score": 1.9603350439234233}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8096165892374184, "4": 0.18736700348519958, "3": 0.0029894914190810055, "2": 2.4440719124851474e-05, "1": 1.3489487129913991e-06}, "score": 4.806575077891109}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9203983762510128, "4": 0.0792352819651716, "3": 0.0003609210577995917, "2": 4.14925399550388e-06, "1": 0}, "score": 4.92003032647804}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5817802382890843, "5": 0.3392575247390836, "3": 0.07171565606874285, "2": 0.007060051026171918, "1": 0.0001777891073961304}, "score": 4.252890609754343}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9185866134228228, "4": 0.0799644914273601, "3": 0.0013517158413064963, "2": 8.725514762977715e-05, "1": 6.406566999506709e-06}, "score": 4.917044393375007}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6816482409021962, "4": 0.29245835456571, "3": 0.024006534856733135, "2": 0.00171381397049054, "1": 0.00013593754576761807}, "score": 4.653830534452983}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998229348378865, "4": 0.00016988072241949824, "3": 5.0363144666328515e-06, "1": 6.315106693810596e-07, "2": 0}, "score": 4.999817520329218}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8799925653601045, "4": 0.11311463561864686, "3": 0.006693754175349794, "2": 0.0001701127679406399, "1": 1.4732803790734557e-05}, "score": 4.8729267821642095}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999932502087799, "4": 6.417935918365192e-06, "3": 8.737505560480679e-08, "1": 0, "2": 0}, "score": 4.999993407312359}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9962111608327701, "4": 0.00368901940554711, "3": 9.353292917330824e-05, "2": 2.868383291440801e-06, "1": 0}, "score": 4.996115296306569}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5358300173596252, "2": 0.3621474245217794, "3": 0.08053843138270368, "4": 0.015297699826850506, "5": 0.005943797738433681}, "score": 1.5930364656672782}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7446644237497575, "3": 0.17607321079668362, "2": 0.039681269644029675, "5": 0.03881287723171576, "1": 0.0007347391644756879}, "score": 3.7811655832056537}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.847210382241169, "3": 0.08624411994028958, "5": 0.0637848421955875, "2": 0.0027164312516137763, "1": 3.253266163147483e-05}, "score": 3.9720099345154556}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9918195772611177, "4": 0.008117097008495232, "3": 5.254093383885835e-05, "2": 2.4489896652277065e-06, "1": 0}, "score": 4.9917704055545205}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6144843120005395, "5": 0.3579322701518513, "3": 0.024956536677902187, "2": 0.002398580919612625, "1": 0.00019630401568772267}, "score": 4.327600141558581}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6822528309297178, "4": 0.2509288615853678, "3": 0.06264845868110985, "2": 0.003592440867976514, "1": 0.000517542143202705}, "score": 4.61090343630148}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9689987181023862, "4": 0.029492074875998833, "3": 0.0013679869490437278, "2": 8.669884465891124e-05, "1": 0}, "score": 4.967510083301782}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9836468211039503, "4": 0.015856949824958912, "3": 0.00047766533818399264, "2": 1.0228900109079856e-05, "1": 0}, "score": 4.98315689241386}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981016064328588, "4": 0.0018751999223321813, "3": 2.1030716467494806e-05, "2": 5.242983208626916e-07, "1": 0}, "score": 4.998081162605506}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995221358134775, "4": 0.00046841776498802686, "3": 7.69051351263986e-06, "1": 3.5080055301852904e-07, "2": 0}, "score": 4.999514797324013}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"4": 0.446929908908583, "3": 0.2843580771416755, "2": 0.2069938906335282, "5": 0.05993345593384815, "1": 0.0016910510843016883}, "score": 3.3564541978965843}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5813521299932847, "5": 0.35969346369190514, "3": 0.045688041010461554, "2": 0.012236108322036894, "1": 0.000914182440275957}, "score": 4.286823951675378}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5211063298750417, "3": 0.3681500055838825, "2": 0.06989495548102614, "5": 0.040042323369791674, "1": 0.0008009652460816043}, "score": 3.5296969618342473}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9816411039720427, "4": 0.0178440635553756, "3": 0.00045712000890552556, "2": 2.274857618046348e-05, "1": 1.7161071914078104e-05}, "score": 4.981104470016981}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.850435396046642, "3": 0.08879055475613933, "5": 0.05809104835839418, "2": 0.0026302799331409483, "1": 2.705859116377308e-05}, "score": 3.9639578330370573}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9641032608923233, "4": 0.03557013136102703, "3": 0.0003027691269962051, "2": 1.2577683061573929e-05, "1": 0}, "score": 4.963786189534372}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.984872677092603, "4": 0.015027551439986297, "3": 9.357783575602904e-05, "2": 8.860592632803486e-07, "1": 0}, "score": 4.984782553943015}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.987917305128401, "4": 0.012018069140598957, "3": 6.180093896547194e-05, "2": 3.8984445917571e-07, "1": 0}, "score": 4.98785712988084}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9658777457241855, "4": 0.03346179964174396, "3": 0.0006350121026257871, "2": 1.8891433360535143e-05, "1": 4.887591067938925e-06}, "score": 4.965191893585122}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9698483799812115, "4": 0.02986451478125006, "3": 0.0002735645361368652, "2": 6.8736795384049055e-06, "1": 0}, "score": 4.969567532213933}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5639935295381364, "2": 0.4329099674356035, "3": 0.002652958093082781, "4": 0.00022415001958237817, "5": 0.00021215614953605253}, "score": 1.4397401414537918}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6751177897501415, "3": 0.20376693780194577, "4": 0.10362413634380108, "5": 0.008859955827385321, "1": 0.008625528867272022}, "score": 2.428971973400698}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7613705153815888, "5": 0.17489805808866143, "3": 0.05922728784299906, "2": 0.004454647258420036, "1": 4.0702949453355574e-05}, "score": 4.106640304086522}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4765873294321468, "5": 0.45461016840817625, "3": 0.060623989372970935, "2": 0.006756775498432174, "1": 0.0013644953850175743}, "score": 4.376400687775044}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.3343503111068514, "2": 0.3203062851058221, "3": 0.1863006523072289, "4": 0.10988730921401997, "5": 0.04909658492809006}, "score": 2.21902760579451}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5020315061524263, "5": 0.46690974757549897, "3": 0.030030074984610168, "2": 0.000975816794230959, "1": 3.459639749371773e-05}, "score": 4.4348321890176825}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8797206192867141, "4": 0.11874042154432526, "3": 0.0014572080041736623, "2": 6.268445924367867e-05, "1": 1.012591073379552e-05}, "score": 4.878115515682496}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9949046185223902, "4": 0.0050261600296877115, "3": 3.6046852764498935e-05, "2": 1.4277482572914674e-06, "1": 0}, "score": 4.994897301025408}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7269715177510954, "4": 0.26693999064005114, "3": 0.005743630943981373, "2": 0.00028632329026704727, "1": 4.3741773374331074e-05}, "score": 4.7205346756501925}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9898726366283098, "4": 0.010011254187970865, "3": 0.00010493819501664022, "2": 5.776711395020289e-06, "1": 0}, "score": 4.989761484058416}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8440027551464327, "4": 0.13560271249845376, "3": 0.014372954472344763, "2": 0.004676176921547872, "1": 0.0012052189829029325}, "score": 4.816776287198067}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9961272794994216, "4": 0.0038330842985003625, "3": 3.263823839716268e-05, "2": 1.4675547171158687e-06, "1": 0}, "score": 4.996097214976557}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8920366498235974, "4": 0.10350307050518483, "3": 0.004123376138892578, "2": 0.00025919185955944335, "1": 5.7172473953122456e-05}, "score": 4.887241595775257}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9822796305520782, "4": 0.017506063015969544, "3": 0.00020297494706732658, "2": 4.524841540950611e-06, "1": 0}, "score": 4.9820742905513615}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9909795892294742, "4": 0.00893149397191239, "3": 7.983480465777424e-05, "2": 1.7956400962650438e-06, "1": 0}, "score": 4.990903383217314}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8446682772525547, "2": 0.1476413731795007, "3": 0.00583050885655889, "5": 0.000791058211987416, "4": 0.0007813471598799252}, "score": 1.1648580512501412}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5040211235416776, "4": 0.3084700570971382, "3": 0.11351183209057719, "2": 0.06470497416384888, "1": 0.008883066100377325}, "score": 4.234546061732075}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5636813609445526, "4": 0.40128278528517203, "3": 0.03411277948307264, "2": 0.0008021760985089183, "1": 0}, "score": 4.528028066901329}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8266333927557413, "4": 0.1675954901012431, "3": 0.005079271160639209, "2": 0.0005468709536061235, "1": 0}, "score": 4.8205793432017785}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5931351660230141, "4": 0.3870573793068683, "3": 0.018526417361213653, "2": 0.0011888170998231083, "1": 0}, "score": 4.5722838906022}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5403548098026378, "4": 0.31398313647804754, "3": 0.06162937840344685, "2": 0.04567048646962231, "1": 0.03813423667329958}, "score": 4.273043989410743}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9897649562211905, "4": 0.010097706097396686, "3": 9.300177304432598e-05, "2": 6.2772912509502476e-06, "1": 0}, "score": 4.989697066367356}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9032411562813452, "4": 0.09637182421645771, "3": 0.00036872922163733537, "2": 4.772172051494434e-06, "1": 0}, "score": 4.902875087879012}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9936880138093174, "4": 0.0062804477705552435, "3": 2.4819150629155115e-05, "1": 8.179856854063684e-07, "2": 0}, "score": 4.993666604610281}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8068410453014364, "4": 0.1895252154975848, "3": 0.0030800815656296986, "2": 0.0003515341487285058, "1": 0}, "score": 4.803220245114817}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5070042260608265, "4": 0.2807097953698408, "2": 0.17255380122141764, "5": 0.03492715053253856, "1": 0.004723279081191008}, "score": 3.16857751788124}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7237793849152182, "4": 0.25661712266829834, "3": 0.018315080270267042, "2": 0.001056077929020459, "1": 0.00021860305653506192}, "score": 4.702705988586132}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9534472900143476, "4": 0.04622596156899725, "3": 0.0003171866995130345, "2": 2.5500438573016893e-06, "1": 0}, "score": 4.953131686275101}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9931039188526537, "4": 0.006502750745405565, "3": 0.0002972101778241324, "2": 3.6216200920790964e-05, "1": 0}, "score": 4.992793748612734}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9632269183751799, "4": 0.032923996835073306, "3": 0.0035808728336636586, "2": 0.00021236692522535184, "1": 5.391407405180566e-05}, "score": 4.95906142137509}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"1": 0.992254942726051, "2": 0.007605378383037871, "3": 0.00012924341417920688, "5": 2.426387578251793e-06, "4": 0}, "score": 1.0078736338223444}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.931962473119909, "4": 0.06583526117940716, "3": 0.002122208897394749, "2": 6.734613793225312e-05, "1": 7.570162684945998e-06}, "score": 4.929687640520395}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5257262915225247, "5": 0.4431418486842328, "3": 0.030298008339404617, "2": 0.0007818286180042892, "1": 2.6759179088157396e-05}, "score": 4.411210294247279}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5395212536348228, "3": 0.3373592137982234, "5": 0.06882924855752333, "2": 0.0537486354109443, "1": 0.000533758910188064}, "score": 3.6223685078120815}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8668070291870189, "4": 0.1280956920796153, "3": 0.005016880263098125, "2": 7.477051015389506e-05, "1": 4.405490297512061e-06}, "score": 4.8616284447474865}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8357070382739338, "4": 0.1601895463856125, "3": 0.0038585338471674936, "2": 0.00013976222110292206, "1": 0}, "score": 4.831656403100362}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6355557665247699, "4": 0.3520371743540163, "3": 0.011787507438180788, "2": 0.0005162196008370184, "1": 0}, "score": 4.622800175123802}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9963138555720246, "4": 0.003666048133299893, "3": 1.655561895277696e-05, "2": 2.001515514703049e-07, "1": 0}, "score": 4.996300227814962}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999797314573467, "4": 0.0002008980484956845, "3": 1.1199528183699696e-06, "1": 6.175882232398654e-08, "2": 0}, "score": 4.999796614887395}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999453318073601, "4": 5.419071359954944e-05, "3": 2.5391379939204713e-07, "1": 2.7605605141645898e-08, "2": 0}, "score": 4.999945191025639}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4647613179066847, "1": 0.45179324335813525, "3": 0.07744751483350872, "4": 0.004456934861499972, "5": 0.0013754270696218003}, "score": 1.638634594038539}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9927890491703547, "4": 0.0071451533876506134, "3": 5.609359068509218e-05, "2": 1.8631871782028014e-06, "1": 0}, "score": 4.992737012922802}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.988013179745365, "4": 0.011885239819969771, "3": 7.324020786698431e-05, "2": 1.970855195542836e-06, "1": 0}, "score": 4.987962049765526}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9751698939099842, "4": 0.02410327392985902, "3": 0.0006195036283571254, "2": 5.864413428836062e-05, "1": 0}, "score": 4.9744805440112225}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8418729726138062, "4": 0.15239080076284509, "3": 0.005309680579804876, "2": 0.0003676363454833197, "1": 4.7822849962490666e-05}, "score": 4.835693816003542}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.36063219155439885, "3": 0.31787702017828773, "2": 0.2566045230768978, "5": 0.059729484665994204, "1": 0.004990898127216564}, "score": 3.2135402641259696}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9110307027862703, "4": 0.08642340056240204, "3": 0.0021282377268435184, "2": 0.0003237483634318695, "1": 7.200975226467503e-05}, "score": 4.908058826298491}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7340308289172426, "4": 0.2629095558647163, "3": 0.0030038532434059875, "2": 5.028131605812257e-05, "1": 3.821532644399286e-06}, "score": 4.730916161125744}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9498768598496504, "4": 0.04946096531474329, "3": 0.0006455189442038584, "2": 1.4117152648824539e-05, "1": 1.3947282005357847e-06}, "score": 4.949200008310374}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9503993445794442, "4": 0.04904463878323069, "3": 0.000521923777948099, "2": 2.1707776447024813e-05, "1": 0}, "score": 4.949845769167224}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3645570952071571, "2": 0.3178607770775714, "3": 0.23051784520447063, "1": 0.04424233247250437, "5": 0.04280685609875764}, "score": 3.043826026889492}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9426852851146422, "4": 0.05706558834184606, "3": 0.00023254727971441932, "2": 5.947378641128584e-06, "1": 0}, "score": 4.942450863106987}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9379735065415618, "4": 0.06174958649090716, "3": 0.00027328263644437, "2": 1.4489694186353972e-06, "1": 0}, "score": 4.937699365801538}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9818942301829401, "4": 0.018049108247397666, "3": 5.3831487095360235e-05, "2": 7.054019886273048e-07, "1": 0}, "score": 4.981841073990528}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7712100300501136, "4": 0.22680086345839653, "3": 0.001883379894601959, "2": 5.5578729102792784e-05, "1": 0}, "score": 4.7692540691486585}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.956578889731535, "1": 0.03327582904700219, "3": 0.009992035033600754, "4": 0.00012651457993943376, "5": 2.4122078898444354e-05}, "score": 1.9770415414724085}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998290131599163, "4": 0.00016881139029972867, "3": 1.3740375988759247e-06, "1": 1.5040337282259147e-07, "2": 0}, "score": 4.999827838808932}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9997634718371976, "4": 0.00023423047299504302, "3": 1.7400286140791102e-06, "1": 4.911850447140883e-08, "2": 0}, "score": 4.999762092874772}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978260541505904, "4": 0.0021577298615208687, "3": 1.3276858508435547e-05, "2": 6.501927367061788e-07, "1": 0}, "score": 4.997813760839091}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994639113468984, "4": 0.0005286341252942346, "3": 6.32909058237914e-06, "2": 4.973417109096978e-07, "1": 3.0659168221079564e-07}, "score": 4.999455989126777}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5581380197298427, "4": 0.4082435893542933, "3": 0.029494092202912145, "2": 0.003871979515500733, "1": 0.00015302167193022398}, "score": 4.52049258710609}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7081297920396197, "4": 0.2638694251225935, "3": 0.02500418670337897, "2": 0.0024763870888745167, "1": 0.0004005031204902285}, "score": 4.677052368977152}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9604805133561468, "4": 0.038810381643943764, "3": 0.000681063507446899, "2": 1.0844418871988947e-05, "1": 0}, "score": 4.959794266663591}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.894313476871656, "4": 0.09209398935603498, "3": 0.011959372480760398, "2": 0.0013108113268547456, "1": 0.00029023372828248763}, "score": 4.878890007191588}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.898426283577689, "4": 0.09484708649946347, "3": 0.006294131422231534, "2": 0.0003387800436369125, "1": 9.030452392130029e-05}, "score": 4.891186720948226}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9742026036598439, "1": 0.013438457766335135, "3": 0.012070582317589965, "4": 0.00021387410723455456, "5": 4.863247696154709e-05}, "score": 1.999205749665498}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5273847610303658, "1": 0.462931145397134, "3": 0.0090875275908051, "4": 0.0003006490260394976, "5": 0.00029060866199333616}, "score": 1.5476271049035581}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5859551430683373, "5": 0.3514964736752818, "3": 0.05633159563043259, "2": 0.005799282940621641, "1": 0.0002249901352622246}, "score": 4.282945812943692}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9954698038349099, "4": 0.004422652277833497, "3": 9.878942434324787e-05, "2": 5.178464366436758e-06, "1": 0}, "score": 4.995364216902828}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7383345775523112, "4": 0.22217291586554963, "3": 0.035656828774087226, "2": 0.003584440084405199, "1": 0.0002407383256621765}, "score": 4.694793948550609}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9756007567150402, "4": 0.023230465352662807, "3": 0.0011497692602493097, "2": 1.7422553724691635e-05, "1": 1.1086427927423328e-06}, "score": 4.974413281677462}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9968670055022061, "4": 0.003092932837097794, "3": 3.715902062463881e-05, "2": 3.9904725240032355e-07, "1": 0}, "score": 4.996831544047372}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9988419936074732, "4": 0.0011429046711112448, "3": 1.3280669513680563e-05, "1": 7.168637803221773e-07, "2": 0}, "score": 4.998827665240262}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998275829655257, "4": 0.0001701854216030033, "3": 1.6259325985566657e-06, "1": 2.3273741340403394e-07, "2": 0}, "score": 4.999825631698517}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998219813671976, "4": 0.00017566039514327618, "3": 1.7408292113648458e-06, "1": 1.6006913840758474e-07, "2": 0}, "score": 4.999820217587659}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9990180469317569, "4": 0.0009790772612581677, "3": 2.5544056083084463e-06, "2": 6.828429761153956e-08, "1": 0}, "score": 4.9990156088254665}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9041173003349363, "4": 0.09444191401266541, "3": 0.0012929782508787136, "2": 0.00011435527594431702, "1": 1.7702264300225217e-05}, "score": 4.9025567198824}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9922263185683401, "4": 0.007712072660291349, "3": 6.003517004827325e-05, "2": 7.863144978929077e-07, "1": 0}, "score": 4.992165491888114}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9771617996519812, "4": 0.02274199644723607, "3": 8.742651028121699e-05, "2": 5.4252097266211344e-06, "1": 0}, "score": 4.977066798026784}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9855581332940007, "4": 0.01432333863101026, "3": 0.00010887180160341636, "2": 5.975391137178342e-06, "1": 0}, "score": 4.985440938002179}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"2": 0.885539779111282, "1": 0.09662823429333245, "3": 0.01749487321703707, "4": 0.0002553133356161897, "5": 5.8994873952148644e-05}, "score": 1.921552461207431}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.48771117639105177, "4": 0.2604382734482966, "2": 0.1870589446059177, "5": 0.06052135506172106, "1": 0.004228890979865011}, "score": 3.1859719487153493}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6439954423494201, "4": 0.3416889017167043, "3": 0.014135477599138588, "2": 0.00013158717476700405, "1": 0}, "score": 4.62962738472572}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.5215928376308079, "3": 0.45072303554365045, "4": 0.025108237485815324, "5": 0.0013241127056194985, "1": 0.0012265302878908847}, "score": 2.5036980348792253}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.978423742738493, "3": 0.014571364672257857, "1": 0.006970792911939319, "4": 3.174532777966957e-05, "5": 2.1432525491563733e-06}, "score": 2.007670493792743}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8628058967983955, "4": 0.12296125170865192, "3": 0.01117722559413535, "2": 0.0021818546652487983, "1": 0.0006987377953861932}, "score": 4.845316707177215}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9636782843492314, "4": 0.03505688328662681, "3": 0.0010952890258440254, "2": 9.963490529495756e-05, "1": 3.661864577049059e-05}, "score": 4.962305904534301}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.964372148216873, "4": 0.035299527514175984, "3": 0.0003218467684702424, "2": 3.705668068820443e-06, "1": 0}, "score": 4.964045562285}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9940072262328763, "4": 0.005966388356818735, "3": 2.1520254425377255e-05, "2": 3.450905467508082e-07, "1": 0}, "score": 4.9939895086948765}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.49957282286427984, "4": 0.4323046633786392, "3": 0.0632209465492327, "2": 0.00467665859257642, "1": 0.0002229961614234645}, "score": 4.42633038598281}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7733881282533515, "1": 0.22597554353779295, "3": 0.0006297337165957194, "4": 1.393469329436542e-06, "5": 0}, "score": 1.7746558050971368}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8732075569730033, "4": 0.11387096017406449, "3": 0.008879310245954867, "2": 0.0019967694088373384, "1": 0.0018385491938125308}, "score": 4.854995919657601}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.865870906706288, "4": 0.12981309419806236, "3": 0.003972407281157948, "2": 0.00017160727100226522, "1": 0}, "score": 4.861703484563541}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997783688938031, "4": 0.00021807794788035592, "3": 1.4815718099457282e-06, "2": 7.253381282614588e-08, "1": 0}, "score": 4.999778740864754}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9964258149600971, "4": 0.0033455271647051476, "3": 8.176183402073589e-05, "1": 1.2189934350579417e-05, "2": 0}, "score": 4.996441710106472}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5087549055057877, "1": 0.4471636920275599, "3": 0.04105398791728203, "5": 0.0015617498306916208, "4": 0.0014461274781039355}, "score": 1.6014600139664192}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.49954408326648286, "3": 0.28627373801175626, "5": 0.16049682797548206, "2": 0.05294440914237661, "1": 0.0006300707142729388}, "score": 3.7664181621099857}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9896701412800927, "4": 0.010044875249059242, "3": 0.0002583043544225815, "2": 9.688964505008492e-06, "1": 0}, "score": 4.989409269210455}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9955130388237245, "4": 0.004294116281057113, "3": 0.00014895698276167277, "2": 1.4319089225867563e-05, "1": 0}, "score": 4.995364875430564}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9963622561802624, "4": 0.003513965876475034, "3": 0.0001072215825322254, "2": 3.7118171626687075e-06, "1": 0}, "score": 4.996260407473614}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5602966182696316, "4": 0.4276298474495025, "3": 0.011936999509022076, "2": 0.00012998298508971618, "1": 5.29403416842994e-06}, "score": 4.548084460042572}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6002045891322615, "4": 0.2849793093844354, "2": 0.0782070720576575, "5": 0.035791948969032705, "1": 0.0008168198412227487}, "score": 3.276722567700558}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9699774550221693, "4": 0.029664607809682473, "3": 0.000348815649587256, "2": 3.7038305132097716e-06, "1": 0}, "score": 4.9696264848453735}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9958062434605762, "4": 0.004175210511643179, "3": 1.775898451934112e-05, "2": 3.322925770278914e-07, "1": 0}, "score": 4.9957882727263}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9518890215387198, "4": 0.046456243937026354, "3": 0.0016249914902229916, "2": 2.6988303217256547e-05, "1": 2.509798718170684e-06}, "score": 4.95020275678106}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7617032536872549, "3": 0.12994794913159172, "5": 0.10086228574886275, "2": 0.007336855016811798, "1": 0.00010037212788046339}, "score": 3.9559373386031296}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9857540812346514, "4": 0.014167036304187119, "3": 6.437404719141284e-05, "2": 6.898870144065725e-07, "1": 0}, "score": 4.985701948362375}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9569135461607134, "4": 0.04293168274927045, "3": 0.000144511423236003, "2": 2.5937599936534547e-06, "1": 0}, "score": 4.956771181736185}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9747378236154679, "4": 0.025085612609417173, "3": 0.0001634113363561984, "2": 1.8083838719034671e-06, "1": 0}, "score": 4.97458185122138}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9935358371751661, "4": 0.006449252799008378, "3": 1.2945348804627424e-05, "2": 1.6853751010992748e-07, "1": 0}, "score": 4.993524339259663}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8547832935564109, "4": 0.132350708115294, "3": 0.009078017020792662, "2": 0.002874967238793528, "1": 0.0008952370629124781}, "score": 4.837284515280976}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9539873763108149, "4": 0.04083559301719539, "3": 0.002659082075878515, "1": 0.0016981032264134746, "2": 0.0007907810737473913}, "score": 4.944679878863779}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9766535956716877, "4": 0.023118965060479058, "3": 0.00020822298692018022, "2": 1.0507061531879145e-05, "1": 0}, "score": 4.976432862529714}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8857093000463834, "4": 0.1111411015284871, "3": 0.0027539104377291563, "2": 0.00031572578187247425, "1": 5.09503463743352e-05}, "score": 4.882196681171646}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9752794106630962, "4": 0.024366885989450037, "3": 0.0003203937018854326, "2": 1.460414741601561e-05, "1": 0}, "score": 4.9749480455552435}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8273322428141497, "1": 0.16515931920597823, "3": 0.007353808034447413, "4": 4.000500446704607e-05, "5": 0}, "score": 1.8422564174885716}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5003857389980637, "4": 0.24205935846237686, "3": 0.17291120191290235, "2": 0.07385194745052767, "1": 0.01064597917890967}, "score": 4.147854257953565}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5707073058282707, "4": 0.3047356498495479, "3": 0.07919282323399475, "2": 0.035666485950841965, "1": 0.008184108441442172}, "score": 4.396228928051453}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9844742595039692, "4": 0.015176097830114185, "3": 0.0003042392985281096, "2": 1.4932149274635191e-05, "1": 0}, "score": 4.984170144770034}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9701895812440672, "4": 0.028374687966964376, "3": 0.0013181816894666145, "2": 8.699890722680607e-05, "1": 0}, "score": 4.968726996536153}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9976469852894208, "4": 0.00233114526994886, "3": 2.1399649811905676e-05, "2": 3.270168952345259e-07, "1": 0}, "score": 4.9976250740406645}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998340188763911, "4": 0.0001642327383305882, "3": 1.1499041119253238e-06, "1": 8.873042467159504e-08, "2": 0}, "score": 4.999833112446676}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9803170345411836, "4": 0.01954785338222687, "3": 0.0001281900025176812, "2": 2.5940064125575646e-06, "1": 0}, "score": 4.980187898845386}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984713103382022, "4": 0.0015063928907447493, "3": 1.9785959261919258e-05, "2": 8.300291635216318e-07, "1": 0}, "score": 4.998451542500621}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9262980943454926, "4": 0.07032333504764147, "3": 0.002959635973898785, "2": 0.0003140268707752679, "1": 9.279461016290003e-05}, "score": 4.922443194494208}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5720500222156675, "5": 0.3805691818278866, "3": 0.04353792855434832, "2": 0.00344295556708317, "1": 0}, "score": 4.330277423990063}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6463769897170876, "5": 0.3147823283917874, "3": 0.037779195933370015, "2": 0.0010223064284484065, "1": 0}, "score": 4.274969292768986}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5163846734804297, "4": 0.46819409787303934, "3": 0.015228900617584806, "2": 0.00013759334478813753, "1": 0}, "score": 4.500908003214618}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9575662018539274, "4": 0.04180614252034786, "3": 0.0005914188958547087, "2": 1.9436515865896998e-05, "1": 0}, "score": 4.956951986924513}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5963092921276885, "4": 0.3835396015546028, "3": 0.019640229319075015, "2": 0.0004661714840534021, "1": 2.4238361352928575e-05}, "score": 4.575675787200994}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9809587776929747, "2": 0.01894856643847462, "3": 6.922537997064704e-05, "5": 3.065144023369445e-06, "4": 0}, "score": 1.0190996667458037}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5755681321947179, "5": 0.2881431136140988, "3": 0.11931537278084643, "2": 0.016001455374064725, "1": 0.0009135087533325029}, "score": 4.134092137123439}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6328820431101801, "5": 0.31718654758630777, "3": 0.048379084359121215, "2": 0.0014489581471720128, "1": 7.120667456853026e-05}, "score": 4.265704471997546}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8398655915561116, "4": 0.15737592640917558, "3": 0.002607945584433137, "2": 0.0001125558516954434, "1": 0}, "score": 4.837064326472461}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.43199204727202967, "3": 0.3327286786311021, "5": 0.13383434167272096, "2": 0.08057734084093927, "1": 0.020798121684131678}, "score": 3.5775272671692333}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9085645340879983, "3": 0.06198197264545587, "1": 0.018160470455584995, "4": 0.01039011921420362, "5": 0.00089040192148789}, "score": 2.0672737874177862}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4748185442680295, "3": 0.25218097360255043, "2": 0.15626885900765647, "5": 0.11173038350526773, "1": 0.004899464821169517}, "score": 3.5322656938606207}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8264486773659947, "4": 0.17044294017508602, "3": 0.002976713319619998, "2": 8.61537557902836e-05, "1": 0}, "score": 4.82333713104007}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8358925774725215, "4": 0.1609679342472561, "3": 0.0029107834710439305, "2": 0.00019485926069614734, "1": 2.4691611188819588e-05}, "score": 4.832525621533854}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5307070525978578, "4": 0.44045775085462546, "3": 0.025683230751328733, "2": 0.003009306877482317, "1": 0.00013451107773122887}, "score": 4.498605737418628}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.790303784574947, "3": 0.17252826514855288, "4": 0.030957870962076032, "1": 0.0045839417815972, "5": 0.0014296208639048467}, "score": 2.2341949510944894}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8590177273640995, "4": 0.14038118589030799, "3": 0.0005736621062762176, "2": 2.1070365149386124e-05, "1": 0}, "score": 4.858407379083358}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9899145764406252, "4": 0.01003523378544725, "3": 4.3663065338345084e-05, "2": 7.871925147148149e-07, "1": 0}, "score": 4.989875020393849}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9937495796573493, "4": 0.00623405235108882, "3": 1.3232852428700937e-05, "2": 5.585710560168737e-07, "1": 0}, "score": 4.993737790095875}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5310733668280261, "4": 0.4446832535650268, "3": 0.02319422392633917, "2": 0.0010138933062601157, "1": 2.2486532129317286e-05}, "score": 4.505790358590596}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4506980842070621, "3": 0.2784817086134206, "5": 0.20811339074654137, "2": 0.05885489918839817, "1": 0.003835087608365454}, "score": 3.800413261959034}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9875755912848128, "4": 0.012376097346426784, "3": 4.138744433761246e-05, "2": 7.12370283232031e-07, "1": 0}, "score": 4.987538913251334}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9845319139737183, "4": 0.015417784472437473, "3": 4.8044735091893e-05, "2": 2.9281934150158257e-07, "1": 0}, "score": 4.984485217128331}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9668210824183983, "4": 0.033069618109462615, "3": 9.674499100043047e-05, "2": 2.8417883592790968e-06, "1": 0}, "score": 4.966728043383165}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9960519471345727, "4": 0.0039080021290852345, "3": 3.142332834407276e-05, "2": 1.1320606521282771e-06, "1": 0}, "score": 4.996025725243701}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7964376600916305, "4": 0.16657153869633595, "2": 0.034602639974088335, "5": 0.0022576819001375917, "1": 0.00011724286562935516}, "score": 3.1362515802815163}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5839484912255528, "5": 0.4060398790268588, "3": 0.009874108013713119, "2": 0.00012683494023694913, "1": 6.2216619025257704e-06}, "score": 4.395895203871203}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8183822444683287, "4": 0.1798193038148229, "3": 0.0016916594647873834, "2": 7.588496369300226e-05, "1": 0}, "score": 4.816564052856807}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5716568386865161, "5": 0.4175213325785733, "3": 0.010676662439019049, "2": 0.00013799680848428114, "1": 4.0783828843148e-06}, "score": 4.406557698086272}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9483943046767777, "4": 0.05142547534625915, "3": 0.00017706069049663593, "2": 1.8555247830506118e-06, "1": 0}, "score": 4.9482147691827985}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6182185149246967, "3": 0.16716457045130992, "5": 0.15462142020510852, "2": 0.05869807186276042, "1": 0.0012753416187318272}, "score": 3.866231727443231}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5134642665799103, "3": 0.41646847937958403, "5": 0.03604314449173223, "2": 0.03366955036739645, "1": 0.0003270871201742447}, "score": 3.5512419747088964}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8490364081681346, "4": 0.1492969206351999, "3": 0.0016398698500840914, "2": 9.13650162631325e-06, "1": 0}, "score": 4.8473932343849}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9902268150333519, "4": 0.009707155354517794, "3": 5.754421207300344e-05, "2": 1.21151853208147e-06, "1": 0}, "score": 4.990174050192945}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6961465572869892, "5": 0.22889408347467116, "3": 0.07264349731440403, "2": 0.0021491926908187983, "1": 0.00012807801340185322}, "score": 4.1515738161568665}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.39772806539405975, "5": 0.3152595219980245, "3": 0.25016544499992827, "2": 0.030035589012549622, "1": 0.006660598057753455}, "score": 3.985038848949337}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.538691369715698, "1": 0.3865983191472307, "3": 0.07001962633615935, "4": 0.0034348030197605124, "5": 0.0011975972752940646}, "score": 1.6938658621773826}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6825032295451037, "4": 0.3104185595797613, "3": 0.006854495257293025, "2": 0.0001998337074546191, "1": 1.2510797331311122e-05}, "score": 4.675219212474912}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7830438437396741, "4": 0.19090020011111292, "3": 0.024181284809308052, "2": 0.0014088708655243531, "1": 0.00045888239535667354}, "score": 4.754673390903403}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7391533421740945, "4": 0.24855341670150743, "3": 0.011841377658534527, "2": 0.00036210015975590416, "1": 8.17537808767087e-05}, "score": 4.726348320558617}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5035830323963434, "3": 0.3111445138412703, "4": 0.12728567617213102, "1": 0.031656246123159974, "5": 0.026309957481230963}, "score": 2.613002104402696}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7216284678501825, "4": 0.25485069884963074, "3": 0.02149912376059937, "2": 0.001770659151045656, "1": 0.00024148770430952363}, "score": 4.695870217061715}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9440839846534859, "4": 0.05472008239020635, "3": 0.0011563104377698972, "2": 2.832128261745364e-05, "1": 8.07136455611048e-06}, "score": 4.942849862840585}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996746002139981, "4": 0.00030727790249133243, "3": 1.3884874163668745e-05, "1": 2.428025942752924e-06, "2": 9.937765046377087e-07}, "score": 4.999652258632416}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975353519447545, "4": 0.0023045897523523797, "3": 0.00014371246865406762, "1": 8.223266856924654e-06, "2": 7.33127583936332e-06}, "score": 4.9973530963209205}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.45867829362735746, "5": 0.20687306218008722, "3": 0.17372744776457802, "2": 0.15132473324518886, "1": 0.009325492498447463}, "score": 3.7024985565487554}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9463037667243178, "4": 0.05293043895625106, "3": 0.0007095607083849927, "2": 3.98153118424487e-05, "1": 1.0847076080107283e-05}, "score": 4.945487301684726}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.871755085304276, "4": 0.12518261347092635, "3": 0.0030069214430782218, "2": 4.937526340363768e-05, "1": 3.5583841734469905e-06}, "score": 4.868640862993943}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963518336877583, "4": 0.0036040718617231407, "3": 3.915325489119678e-05, "2": 2.016191947971709e-06, "1": 0}, "score": 4.996311562263957}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4869891867231295, "3": 0.3837199459079126, "2": 0.08986170514024122, "5": 0.038143138242911885, "1": 0.001265445177170072}, "score": 3.4708925581222125}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9683192232355049, "2": 0.031638400198102594, "3": 3.9142058661435104e-05, "5": 5.223129017549672e-07, "4": 0}, "score": 1.0317188595947597}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6009348457845336, "4": 0.3752443369455615, "3": 0.022426349376107216, "2": 0.0013310323963608107, "1": 6.207582104476529e-05}, "score": 4.575660986865224}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5776681847389055, "5": 0.4098344013579324, "3": 0.012325068515523391, "2": 0.00015264295365291925, "1": 0}, "score": 4.3972118729758085}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9787202099236026, "4": 0.02109516313682689, "3": 0.00017707680375261305, "2": 6.496551891804097e-06, "1": 7.673314428816153e-07}, "score": 4.978528118127841}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9881197837200754, "4": 0.011784348809462506, "3": 9.15391324556188e-05, "2": 3.289914438697803e-06, "1": 5.860674216367341e-07}, "score": 4.988020353493558}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.55647505169957, "4": 0.43131747892828015, "3": 0.012069459805632047, "2": 0.00013150850915985416, "1": 5.337794528224242e-06}, "score": 4.544127194454974}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999453318073601, "4": 5.4128646612940465e-05, "3": 4.1272967427431596e-07, "2": 9.392118094441853e-09, "1": 0}, "score": 4.9999450177112275}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9700073996583913, "4": 0.029632160621235606, "3": 0.0003512759363148792, "2": 3.748214367698366e-06, "1": 0}, "score": 4.969653878521496}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.995812030605376, "4": 0.004169679936308544, "3": 1.754499208596277e-05, "2": 3.2729039566619323e-07, "1": 0}, "score": 4.995794246453793}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9592363527083122, "4": 0.04051747971824112, "3": 0.00023677079369447093, "2": 6.7021847676335284e-06, "1": 1.4309013465257872e-06}, "score": 4.958983096701882}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9301662326712402, "1": 0.04107480345901064, "3": 0.028130403850691783, "4": 0.000595424655656883, "5": 2.9722536356991767e-05}, "score": 1.9883355775034097}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5777444939691597, "4": 0.4165085455744534, "3": 0.005620466002049172, "2": 0.00011252737866695435, "1": 0}, "score": 4.571906961077579}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6638763743817198, "4": 0.3286551678228042, "3": 0.007355585664667297, "2": 8.671384485651693e-05, "1": 0}, "score": 4.656364530398414}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7471069211667438, "4": 0.2503129610058265, "3": 0.002543510666702015, "2": 3.0307389418004577e-05, "1": 0}, "score": 4.744507485948105}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7530010023808965, "3": 0.1311707984545624, "5": 0.10918481304746752, "2": 0.006431816350404273, "1": 0.00019583501762749834}, "score": 3.9645623192362005}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9979858407465758, "4": 0.0019568309040478107, "3": 5.42466130364787e-05, "2": 1.908568639980913e-06, "1": 8.686174736679233e-07}, "score": 4.997925475062268}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6573245727736041, "5": 0.24799162588004042, "3": 0.08666160865594502, "2": 0.00784394015559149, "1": 0.00013440001745523134}, "score": 4.1452453062328605}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7318185340920469, "4": 0.26325248192428946, "3": 0.0046268531832573375, "2": 0.00025411871963636266, "1": 0}, "score": 4.7267183347289015}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964098382970235, "4": 0.003575373617160981, "3": 1.0562442595936353e-05, "1": 0, "2": 0}, "score": 4.996403486300063}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992705570729384, "4": 0.0007217687941969668, "3": 2.635641373727759e-06, "1": 0, "2": 0}, "score": 4.999272956259852}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9662641402837531, "3": 0.032510807710135765, "1": 0.0011904927284926805, "4": 3.305978397249617e-05, "5": 1.018308133977446e-06}, "score": 2.0313895045781654}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9520464246415355, "4": 0.04748357581739136, "3": 0.000434259012015611, "2": 3.685810908319908e-06, "1": 0}, "score": 4.951635298408974}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.818177838115077, "4": 0.17536992131166276, "3": 0.006413009611910433, "2": 3.32596702021102e-05, "1": 0}, "score": 4.811703156078633}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987340233254387, "4": 0.0012417316271741317, "3": 2.1420845955579382e-05, "2": 7.748464161047084e-07, "1": 0}, "score": 4.998713099504349}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9645375965920088, "4": 0.03521499122388654, "3": 0.00024426301082137823, "2": 1.1951534150809909e-06, "1": 0}, "score": 4.9642928275217}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5065840430679289, "1": 0.4921222587327214, "3": 0.0012723432497943991, "4": 1.2029579293928087e-05, "5": 8.266494667737317e-06}, "score": 1.5091984234618534}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7153228140474487, "4": 0.2780293208971783, "3": 0.0063015187702223675, "2": 0.00027616694553045336, "1": 6.589420872892054e-05}, "score": 4.70827431380812}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9428105103177118, "4": 0.055221080802929666, "3": 0.0018034171448221938, "2": 0.00013230734111304267, "1": 1.832967915655309e-05}, "score": 4.940700992947159}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9938951086407034, "4": 0.006086896092572898, "3": 1.7432156197032124e-05, "2": 3.407931983784919e-07, "1": 0}, "score": 4.993877215854237}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9952991303372176, "4": 0.004652623615998404, "3": 4.097862371610251e-05, "2": 2.028163204259881e-06, "1": 0}, "score": 4.995259309809248}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8684662622972024, "3": 0.1016806560517399, "4": 0.024233546178319115, "1": 0.0033303229423743974, "5": 0.00227573545932133}, "score": 2.153646702551493}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8532872717939397, "4": 0.11927452619054157, "3": 0.023268285103006194, "2": 0.0039726865512060405, "1": 0.00018637645091254038}, "score": 4.821523400977165}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5063522022241549, "4": 0.466179092508609, "3": 0.026970119796434596, "2": 0.000480799410896928, "1": 8.99843396191692e-06}, "score": 4.4783976922840125}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6593981459969739, "4": 0.3314852715687861, "3": 0.008647984421897983, "2": 0.0004161257748542194, "1": 0}, "score": 4.649952014461827}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4900401071012759, "5": 0.4689938141821111, "3": 0.038435652485056676, "2": 0.002420698848816306, "1": 8.339726857793359e-05}, "score": 4.425477775072078}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6262846053912219, "5": 0.2786127093633932, "3": 0.07228892808965352, "2": 0.02118198548102887, "1": 0.001562695131486084}, "score": 4.159282727617441}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9518985214385591, "4": 0.04672151564297632, "3": 0.0012963577208032738, "2": 4.222483512311498e-05, "1": 0}, "score": 4.9505570484427865}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7838937741243139, "4": 0.20750289242727135, "3": 0.008142465156801615, "2": 0.0003620127955282731, "1": 0}, "score": 4.775103906657667}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912058190224137, "4": 0.008768820274039373, "3": 2.418185498611268e-05, "2": 4.583581369483048e-07, "1": 0}, "score": 4.991181434587886}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6792924617035967, "4": 0.27995813635750005, "3": 0.02925552600207906, "2": 0.006995727314007606, "1": 0.004010096392189791}, "score": 4.624319892613148}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8858394876234572, "1": 0.09731173409407605, "3": 0.01603403866381494, "4": 0.0006736222931852504, "5": 0.0001397221849620269}, "score": 1.9204886047814276}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7955342638809051, "4": 0.20110458155331876, "3": 0.003240648548237427, "2": 0.00010109862827822221, "1": 0}, "score": 4.792106790800936}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5958505132924161, "5": 0.39366641135536834, "3": 0.010165738330094909, "2": 0.0003066107592508214, "1": 8.874150016305068e-06}, "score": 4.382861538159498}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9673424090966225, "4": 0.032538645621989826, "3": 0.0001140050856043872, "2": 2.0532800892155533e-06, "1": 0}, "score": 4.967227089753904}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5214307517663204, "4": 0.46538284014059045, "3": 0.012844448298806934, "2": 0.00032976311322019944, "1": 1.057261912736968e-05}, "score": 4.507895884238063}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8385648417992774, "1": 0.16012655622484612, "3": 0.0013005574483536014, "4": 5.777572189145719e-06, "5": 2.013159861307539e-06}, "score": 1.841191555542606}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.4125876545098407, "5": 0.2961950763522902, "2": 0.15086870857796353, "3": 0.13424044786072456, "1": 0.0061006924368952695}, "score": 3.8419139609850803}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8023975706048093, "4": 0.09670712478222467, "3": 0.050879590923914246, "2": 0.04318457101313214, "1": 0.0068167408675876345}, "score": 4.644707900011475}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9959711735851065, "4": 0.004005543509215414, "3": 2.1901049498152223e-05, "2": 1.0323766361252292e-06, "1": 3.1583039251482407e-07}, "score": 4.995946293803905}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5753094149264831, "5": 0.37168013007316975, "3": 0.049325030930408006, "2": 0.003618806513168016, "1": 6.619298946164289e-05}, "score": 4.314919040852371}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5208325968961927, "3": 0.4210452242700429, "2": 0.05122404644818399, "5": 0.006743231620833792, "1": 0.00010580920907830642}, "score": 3.482907101932397}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9520729061811273, "4": 0.04769693208655352, "3": 0.0002221355004277797, "2": 3.0373169940046597e-06, "1": 0}, "score": 4.951849444742586}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7971522177770283, "3": 0.12043236137963556, "5": 0.08112387269141583, "2": 0.0012735398147466265, "1": 1.0181329053600512e-05}, "score": 3.958113559849619}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9145136729300004, "4": 0.08501225129462708, "3": 0.0004588230198163944, "2": 6.652592031950699e-06, "1": 0}, "score": 4.914049405700479}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7545181616177403, "4": 0.24325675220678564, "3": 0.00215665040360106, "2": 5.253326342247194e-05, "1": 0}, "score": 4.752268407642003}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"1": 0.6781105847437462, "2": 0.31866958394551864, "3": 0.003098880691343749, "4": 4.947411274683832e-05, "5": 4.674547959779269e-05}, "score": 1.32521079238174}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7173967099278935, "3": 0.11177336327524381, "4": 0.08834398182210254, "2": 0.049206856767559606, "1": 0.0332092774775993}, "score": 4.407610256254115}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.891590181282694, "4": 0.09142996587886083, "3": 0.014633051608806754, "2": 0.0015832841709691123, "1": 0.000663909973339489}, "score": 4.8718856774029975}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9900792030230393, "4": 0.004365130033936171, "1": 0.0034241911354204505, "3": 0.0014851379728995048, "2": 0.0006219073072773998}, "score": 4.9771015481354945}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6368496879094213, "4": 0.26098997039582655, "3": 0.07816917427510069, "2": 0.017774996503530444, "1": 0.006080706433701692}, "score": 4.504956805038392}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5175833779546263, "2": 0.34118879632395244, "4": 0.1339567087847106, "5": 0.004731414843304966, "1": 0.002424349592125636}, "score": 2.7973586677785818}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8026521555649907, "3": 0.18065280396059094, "5": 0.015077123257773436, "2": 0.0016099235267933354, "1": 4.0419755014429e-06}, "score": 3.831191679234828}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8567455776627546, "4": 0.14179758444114152, "3": 0.00139101497564341, "2": 2.9742010995553468e-05, "1": 0}, "score": 4.85532593960291}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8487648533476772, "4": 0.1475658149013614, "3": 0.0036162887001354236, "2": 4.634333840565462e-05, "1": 5.413493093436517e-06}, "score": 4.845040724399161}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5821620404413709, "5": 0.38850610306220484, "3": 0.02761374011173548, "2": 0.0016530728330212967, "1": 6.034520902907035e-05}, "score": 4.357406860877234}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"2": 0.602935411459087, "3": 0.3038459042513794, "4": 0.07740318882079834, "1": 0.010581875498213498, "5": 0.005217995263454489}, "score": 2.4637316378561254}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.3106119795349146, "4": 0.31004907114933816, "3": 0.2915654121234375, "2": 0.07969585516470239, "1": 0.008032547126608997}, "score": 3.8355497932584455}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.4784732564680283, "4": 0.4558184247977208, "2": 0.0390621856061682, "5": 0.026429031367921886, "1": 0.0002074373897436957}, "score": 3.469203961708796}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99085468808798, "4": 0.009031864991890338, "3": 0.00010294610079013721, "2": 3.7007761131496375e-06, "1": 0}, "score": 4.990751077585117}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9462702539698499, "4": 0.05114917580543757, "3": 0.0024390896586741406, "2": 0.00010520002710590545, "1": 2.2444140052692592e-05}, "score": 4.943566487399095}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6281202374076619, "5": 0.20726920984957373, "3": 0.15823315011395106, "2": 0.006256744982177749, "1": 0.00011171405854064303}, "score": 4.036187751243986}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4664132664450206, "4": 0.42768986951054166, "3": 0.09447536181600139, "2": 0.010992588565932363, "1": 0.0003511591564817774}, "score": 4.348926380626073}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6857359074093118, "4": 0.3085929143331266, "3": 0.005596915144934347, "2": 5.7662414029908954e-05, "1": 0}, "score": 4.6800349564916655}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5763896910956307, "5": 0.374642080796369, "3": 0.047799217973767134, "2": 0.001100149719283698, "1": 5.676798701586327e-05}, "score": 4.324476183127848}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9815651769691651, "4": 0.0177927608184478, "3": 0.0006023571597260895, "2": 2.615359240563904e-05, "1": 1.0941802633514354e-05}, "score": 4.980880246978339}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9169761002888951, "2": 0.08289098236660183, "3": 0.0001298137924622552, "4": 3.030821336553224e-07, "5": 0}, "score": 1.0831517520619067}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6363615514762699, "5": 0.3405509267382084, "3": 0.022407039636653418, "2": 0.0006234777369858247, "1": 0}, "score": 4.316914997180614}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9791992501525018, "4": 0.02067363628212372, "3": 0.00010897805786394554, "2": 1.224943300922489e-06, "1": 0}, "score": 4.979104379415512}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7592242657001136, "4": 0.23191009592147896, "3": 0.008459146474438283, "2": 0.000356556801430816, "1": 3.452589278208741e-05}, "score": 4.749959984235174}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.83772270853059, "3": 0.1025891810152463, "5": 0.05282167822967694, "2": 0.006619686279233744, "1": 0.00023020991301136233}, "score": 3.9363014415955133}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9033587659361154, "4": 0.09422061297001291, "3": 0.002232162349225698, "2": 0.0001311779184652204, "1": 0}, "score": 4.900915852954336}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7378869133989028, "5": 0.18485474952288278, "3": 0.07092856749573995, "2": 0.006226175619026729, "1": 6.434476366244875e-05}, "score": 4.101284771844347}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9983515305208724, "4": 0.0016239536147445138, "3": 8.59040221012212e-06, "1": 0, "2": 0}, "score": 4.998358839444595}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984522962306982, "4": 0.0015349553289924812, "3": 6.7709036592462465e-06, "2": 2.054222952133643e-07, "1": 0}, "score": 4.998450877655092}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9974637086357713, "4": 0.0024973572655641683, "3": 3.385462282444879e-05, "2": 2.070459488912136e-06, "1": 0}, "score": 4.997428714373279}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5904523977838487, "4": 0.20277262532109708, "2": 0.19981444861338657, "5": 0.0058253394881569295, "1": 0.0011317066227191526}, "score": 3.0123454854276748}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9562281057989781, "4": 0.041456118363780714, "3": 0.0020241233211319913, "2": 0.00023033633295270407, "1": 5.046048516268608e-05}, "score": 4.953602280374814}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8911189845205076, "4": 0.10692137796298427, "3": 0.0018709729299881636, "2": 6.506654776742264e-05, "1": 0}, "score": 4.889138860428268}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9877735202774544, "4": 0.012116946124699525, "3": 0.0001015299224972201, "2": 2.8775020037488984e-06, "1": 0}, "score": 4.987671298325233}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993509201435279, "4": 0.0006439693668463756, "3": 4.931023425867237e-06, "2": 1.0658958837636848e-07, "1": 6.780295899217184e-08}, "score": 4.99934557760238}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9464975659200867, "4": 0.044597521198929464, "3": 0.006115518634182285, "1": 0.0013773154506945158, "2": 0.0009787469763124226}, "score": 4.93469764121102}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.667074376691902, "3": 0.2960361807098331, "4": 0.01938554100140052, "1": 0.01501350724607371, "5": 0.00245509456286219}, "score": 2.327170588207527}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5544547392276001, "4": 0.30582017902773234, "5": 0.08423596594041055, "2": 0.054837336172654384, "1": 0.0005857483485249364}, "score": 3.418310899644278}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9342504116460967, "4": 0.061710943346330045, "3": 0.0037729390212666316, "2": 0.00020410663093881678, "1": 3.795254478927237e-05}, "score": 4.929977392727832}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9977726514303421, "4": 0.0021869696824579187, "3": 2.9031154834271618e-05, "2": 1.2023302610280953e-06, "1": 0}, "score": 4.997751338203512}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5322636125788214, "4": 0.26592413969264095, "2": 0.1776657682946668, "5": 0.022096222779959745, "1": 0.002036297644832676}, "score": 3.128380013726005}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.727337429145958, "4": 0.23902928575921192, "2": 0.018576168188359537, "5": 0.014979510175386552, "1": 7.341553472372457e-05}, "score": 3.2502663557676175}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8210702227469074, "4": 0.1728784902081253, "3": 0.006014743342752183, "2": 3.164390509361966e-05, "1": 0}, "score": 4.814996184909929}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6422675933901713, "4": 0.3279662408935739, "3": 0.029093561022300173, "2": 0.0006373522962075076, "1": 2.8776628807675885e-05}, "score": 4.611816959874299}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5958404792542591, "4": 0.3564127534267651, "3": 0.044135152729870494, "2": 0.003318037782990788, "1": 0.00024416337184069776}, "score": 4.544363659720805}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.948267260595341, "3": 0.03984012933143699, "1": 0.010961901697151494, "4": 0.0008818081875866684, "5": 4.6822439193644086e-05}, "score": 2.0307823752850984}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5972279336782435, "3": 0.3870538958061303, "4": 0.014779661001857304, "1": 0.0007737969943328425, "5": 0.00016091906841793834}, "score": 2.4163237573245464}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5751804852763567, "4": 0.3219499114631004, "2": 0.0987701347285056, "5": 0.0038830303971461888, "1": 0.00019969866551769697}, "score": 3.2305502994875286}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7027665985856565, "3": 0.21971845548538424, "5": 0.047851419303878796, "2": 0.029182498962196074, "1": 0.0004535388613584793}, "score": 3.7684009829306135}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.713571383584174, "3": 0.1873472935131956, "1": 0.09004533619355995, "4": 0.008592180788026668, "5": 0.0004391032407441072}, "score": 2.1158041732079247}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.981984923104114, "1": 0.010132056200766192, "3": 0.007874268401365098, "4": 8.194060462434706e-06, "5": 5.783356080578829e-07}, "score": 1.9977603353733704}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9298387787923551, "4": 0.06902449758030606, "3": 0.0010936013916665237, "2": 3.0896396468608435e-05, "1": 0}, "score": 4.928694738680297}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.666118257760134, "5": 0.29357727102601006, "3": 0.03889160349943174, "2": 0.0013570500716853728, "1": 3.6904096382625735e-05}, "score": 4.251865618766115}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7451658857146828, "4": 0.2506072766575983, "3": 0.004017272858387909, "2": 0.0001631259428468432, "1": 2.457661934755581e-05}, "score": 4.740764825866622}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993919865751202, "4": 0.0006023129483331433, "3": 4.720754119728211e-06, "2": 1.934824550816766e-07, "1": 0}, "score": 4.99938766461462}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"1": 0.948816419826934, "2": 0.05060342587201816, "3": 0.0005634123963572707, "4": 7.651353482181417e-06, "5": 6.8029446687140085e-06}, "score": 1.0517805349573444}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6898431817826306, "4": 0.19423288533490327, "3": 0.07113920412298638, "1": 0.023284962803355153, "2": 0.02045895899014843}, "score": 4.5084603803751}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8593074971355862, "4": 0.13301669929941393, "3": 0.007564069045913477, "2": 8.124510375883042e-05, "1": 0}, "score": 4.8516069028787125}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.3976791319433413, "5": 0.39647115087979234, "3": 0.17732063287487843, "2": 0.023294390464327797, "1": 0.0050941080062972925}, "score": 4.157301527423374}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6106222865015496, "3": 0.1930882964763363, "5": 0.15767256022410822, "2": 0.03512920300434649, "1": 0.0032771556915612786}, "score": 3.88447007183378}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7157045763704709, "3": 0.17097090211996338, "4": 0.07651075192395805, "1": 0.030438287676057562, "5": 0.006003596936256323}, "score": 2.3116808185134596}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9497191943273138, "4": 0.049879125021209024, "3": 0.0003229513064922791, "2": 3.034523665175985e-05, "1": 0}, "score": 4.949381487524259}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6366702807850183, "4": 0.3580788734314513, "3": 0.005166579576646748, "2": 6.546695804059522e-05, "1": 0}, "score": 4.6313846368491935}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9875143249831747, "4": 0.012465779859807007, "3": 1.8324400969051462e-05, "2": 3.537388174278489e-07, "1": 0}, "score": 4.987496494904822}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5076034482105427, "5": 0.4795939167100627, "3": 0.012070575075242748, "2": 0.0006858386239277342, "1": 2.6072772170971644e-05}, "score": 4.466082836990854}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5191135674522216, "5": 0.24183698391389194, "3": 0.17679408238709085, "2": 0.05925171228853017, "1": 0.0027603563369394176}, "score": 3.9382433827008327}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.969511175781211, "4": 0.030193201374328023, "3": 0.0002840208235874526, "2": 7.359636610616092e-06, "1": 0}, "score": 4.96921654747343}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7501732793529092, "4": 0.2389443737394952, "3": 0.010404885744743, "2": 0.0003845318260047278, "1": 5.412041968391775e-05}, "score": 4.738865643272651}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9935327757979076, "4": 0.006346460646338904, "3": 0.00010472947092414607, "2": 4.4306112665774744e-06, "1": 0}, "score": 4.993430712351457}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9894525446581414, "4": 0.010429363893379702, "3": 0.00010411421919296613, "2": 3.5716495859504493e-06, "1": 0}, "score": 4.989351581916513}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"2": 0.708559721876657, "1": 0.2569103211304759, "3": 0.03412685049457459, "4": 0.0003451651706474184, "5": 5.588771328969534e-05}, "score": 1.778074067094981}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945700909394641, "4": 0.0053908403344899115, "3": 3.616220663876773e-05, "2": 1.3741049283678295e-06, "1": 1.1617227793329568e-06}, "score": 4.9945280640179295}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9859852282328414, "4": 0.013775600932924445, "3": 0.00022627386506425036, "2": 9.807570210797278e-06, "1": 2.511518519257257e-06}, "score": 4.985732374307257}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987868110095071, "4": 0.0012041377841263046, "3": 8.481069464633416e-06, "2": 1.921429904834721e-07, "1": 1.7104622420234908e-07}, "score": 4.998777639210112}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9112195152419356, "4": 0.08726578651472863, "3": 0.0014612613176851752, "2": 4.246259445698397e-05, "1": 8.838662444023307e-06}, "score": 4.909648755456423}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6252595346502593, "1": 0.18458574147690415, "3": 0.16264797112676466, "4": 0.021858714587463572, "5": 0.005561530159719154}, "score": 2.038467577057058}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9861610539480903, "4": 0.013546067434721806, "3": 0.00015933000555453964, "2": 6.8291591720867475e-06, "1": 0}, "score": 4.9861130253268255}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7572122816162866, "4": 0.23860211622873623, "3": 0.004069484280354276, "2": 6.210531406379903e-05, "1": 0}, "score": 4.753059261366763}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7626625445792987, "4": 0.22649513801655816, "3": 0.010176928830170982, "2": 0.0004953103609770688, "1": 0.00011421413435139886}, "score": 4.751194317402543}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6968263628423659, "4": 0.2854875667132111, "3": 0.01552073511021286, "2": 0.0015603153979232669, "1": 0}, "score": 4.678595560779255}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8413144573812836, "4": 0.12321956914917293, "3": 0.024622392151726655, "2": 0.00917588529296387, "1": 0.0016107795896615296}, "score": 4.793553122089491}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9006829410768775, "4": 0.09530721146392102, "3": 0.0035852022173790085, "2": 0.0002670597878765846, "1": 0}, "score": 4.896704926936711}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9785361661712164, "4": 0.021185824004557756, "3": 0.0002353334766841217, "2": 6.744933011046876e-06, "1": 0}, "score": 4.9783224953396354}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9115239863136037, "4": 0.08731610974493174, "3": 0.001082602190753088, "2": 5.1119680393391194e-05, "1": 0}, "score": 4.910362979949619}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975302534548467, "4": 0.0024538844995478154, "3": 7.859740243264333e-06, "1": 1.9574520459001775e-07, "2": 0}, "score": 4.9975295937537725}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.871707340585755, "3": 0.06546440625494049, "1": 0.05005219089765738, "4": 0.01013916531786132, "5": 0.002625868186252972}, "score": 2.043568631059633}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9428572390501992, "4": 0.054142051663127896, "3": 0.002712062129659273, "2": 0.00018430971162893643, "1": 7.67619103364407e-05}, "score": 4.939572180971879}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5793443765891495, "5": 0.39713428742970375, "3": 0.02280923457050697, "2": 0.0006533691333272537, "1": 0}, "score": 4.373040224094433}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6594516385442055, "4": 0.32026205386208667, "3": 0.017640522652780235, "2": 0.002353642855014563, "1": 0}, "score": 4.637290009414078}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.391709321909087, "3": 0.2727040057553335, "5": 0.17098027158212048, "2": 0.15184750778086595, "1": 0.012697540064343683}, "score": 3.5564614176900786}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7793241260461989, "3": 0.2021573953675676, "1": 0.010282087246726766, "4": 0.00788227272356802, "5": 0.0003442785120880585}, "score": 2.2086747424853783}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9978807757333548, "4": 0.0021047482819911497, "3": 7.232013993025191e-06, "1": 0, "2": 0}, "score": 4.997880772338401}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9699572603017835, "4": 0.029715413343383627, "3": 0.0003072351938312065, "2": 5.572677050534973e-06, "1": 0}, "score": 4.9696529576447555}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962337514720515, "4": 0.003747420283981098, "3": 9.665100954390214e-06, "1": 0, "2": 0}, "score": 4.99623321499852}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8662470620990703, "4": 0.1323304203068402, "3": 0.0013815475432075706, "2": 3.144407458628669e-05, "1": 0}, "score": 4.864810864574486}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9980192039708952, "4": 0.0019429452248563167, "3": 3.105384266236666e-05, "1": 3.463634800255132e-06, "2": 1.8356810516532562e-06}, "score": 4.997975582475602}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5085875221576747, "4": 0.2600069545643282, "2": 0.1885242562502503, "5": 0.02682935916088513, "1": 0.016027817060789668}, "score": 3.0930880250798287}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5590037485698828, "5": 0.29641558676986074, "3": 0.13681559250352787, "2": 0.0073534528540970265, "1": 0.0003644848394902136}, "score": 4.143806412277706}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.48077494893459477, "3": 0.2493604347652881, "2": 0.13208669390084443, "5": 0.12678859320204136, "1": 0.010934022726444632}, "score": 3.580429497491991}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7927120008863479, "4": 0.18541213034947576, "3": 0.014546323466631907, "1": 0.005466642246137726, "2": 0.001703026017443339}, "score": 4.758480962332992}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6438246130200773, "3": 0.2688917491202847, "4": 0.07811224095804987, "1": 0.006252199232050402, "5": 0.0029167520308179587}, "score": 2.427615333689405}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6557634169364587, "5": 0.3105611054593673, "3": 0.032893562797668204, "2": 0.0007473305256074823, "1": 2.4201184009163007e-05}, "score": 4.276103144864161}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9913709894785246, "4": 0.008574813803872441, "3": 5.063264659964264e-05, "2": 7.647888915206862e-07, "1": 0}, "score": 4.991321602242969}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9135185014527389, "4": 0.0856724992878955, "3": 0.0007813904477116443, "2": 2.143618877335689e-05, "1": 3.2827108442720224e-06}, "score": 4.9126870280801755}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.988149347718145, "4": 0.01179694121713978, "3": 3.6046636484031225e-05, "2": 1.3246689219172414e-06, "1": 0}, "score": 4.988126797497856}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9451966631373921, "1": 0.0529889594178982, "3": 0.0018064409417411797, "4": 5.512975844053558e-06, "5": 0}, "score": 1.9488283834597304}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5420663868933988, "3": 0.2103236172323522, "5": 0.17148508227134673, "2": 0.06905601445663119, "1": 0.0070543276459340805}, "score": 3.8018835663342503}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6200041359984554, "4": 0.3724559698104698, "3": 0.007337236543192268, "2": 0.0001607971379815511, "1": 2.3048358633866016e-05}, "score": 4.6122876785518265}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.509611932283139, "3": 0.31365096116288577, "5": 0.09298264650134068, "2": 0.0784951295553082, "1": 0.005229039864877415}, "score": 3.606642391582468}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5420857932174208, "4": 0.4390396724256483, "3": 0.01765613436316035, "2": 0.0010503193691133183, "1": 0.00013631952218332464}, "score": 4.521936638832554}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9203590898847978, "1": 0.07872454434062891, "3": 0.0009131516412299159, "4": 1.3067505479901442e-06, "5": 0}, "score": 1.9221910723902869}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6580697040899177, "5": 0.25889458703354734, "3": 0.080664338780737, "2": 0.0023096469537573455, "1": 4.3159241149179785e-05}, "score": 4.1734846971745725}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6119453180825719, "3": 0.3308944952114462, "5": 0.03373975038782532, "2": 0.023065059091968022, "1": 0.0003535831079416916}, "score": 3.6556537698707636}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9864080560919049, "4": 0.013511650036660468, "3": 7.713780965500593e-05, "2": 1.8297906437093673e-06, "1": 6.242355848521801e-07}, "score": 4.98632607843018}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.533412837617217, "5": 0.44656210294268, "3": 0.01682338661792902, "2": 0.0030740920180804838, "1": 0.00012169021059879036}, "score": 4.42322795472063}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.81947695663815, "3": 0.15235205270923494, "4": 0.02163615978186488, "1": 0.004681959781387362, "5": 0.001851054134009909}, "score": 2.1964959319179425}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8624332623981952, "4": 0.13380747043487565, "3": 0.003632533283005783, "2": 0.00010574711729829784, "1": 1.241990662007109e-05}, "score": 4.8585593303183225}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5054711724206931, "5": 0.45711352745503514, "3": 0.035757901975030766, "2": 0.0014674276632224074, "1": 0}, "score": 4.418500272853792}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9976641892614295, "4": 0.002325757933880803, "3": 8.696203559614573e-06, "2": 2.342785605236354e-07, "1": 0}, "score": 4.997656144192756}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5054575602653083, "4": 0.44682343607309905, "2": 0.024267744432661515, "5": 0.023272054870535804, "1": 0.00017864025910542663}, "score": 3.4687427852807704}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5261715756415656, "4": 0.19868444824525186, "3": 0.18149593903324918, "2": 0.0841751611056327, "1": 0.009389586715400123}, "score": 4.148168895128317}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8854637056566406, "4": 0.05364392233070266, "1": 0.037248388382196435, "3": 0.012505878065056349, "2": 0.010664167384585137}, "score": 4.740235153377796}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.989981400899679, "4": 0.00998217177108228, "3": 2.7712333254994484e-05, "2": 4.4824942824008397e-07, "1": 0}, "score": 4.989960975824054}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9471318238050509, "4": 0.05079520594562764, "3": 0.0017977183526546095, "2": 0.00012423072944823876, "1": 0}, "score": 4.945228393488772}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8641483271244285, "4": 0.13321938479107467, "3": 0.0024328740107969603, "2": 0.0001284195396919679, "1": 0}, "score": 4.86151977722937}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8352295848562348, "3": 0.11179905174561668, "1": 0.03275492324851815, "4": 0.016428550066090036, "5": 0.003773938982596294}, "score": 2.123224764698199}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8633605399479308, "4": 0.12761193218778596, "3": 0.008439375213085503, "2": 0.0004915135746197752, "1": 9.219920960982704e-05}, "score": 4.853665330117278}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7193150422371608, "4": 0.2649226983207324, "3": 0.014617667194670624, "2": 0.0010214684807825748, "1": 0.00010621980274645875}, "score": 4.702347651132031}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982286933186519, "4": 0.0017418308609730673, "3": 2.780913483652655e-05, "2": 1.094522897161437e-06, "1": 5.159933289189858e-07}, "score": 4.998197203226083}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3797002322794123, "4": 0.32938819492353477, "5": 0.2219127261176842, "2": 0.06303712754903001, "1": 0.005956473307344427}, "score": 3.6982672359815068}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7596900407575892, "2": 0.2359779288858684, "3": 0.004036781350339856, "5": 0.00012795703684961236, "4": 0.00011894397191131016}, "score": 1.2449319936210816}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6363058913656927, "4": 0.30105157000142313, "3": 0.04673209926481937, "2": 0.013011782315888763, "1": 0.0028267611293576185}, "score": 4.555109854216258}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"2": 0.554879281336544, "3": 0.36859577356315903, "4": 0.05054138870777506, "1": 0.022239537626305043, "5": 0.003715664675971883}, "score": 2.4585990105380504}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.527551282683483, "5": 0.4301536966883271, "3": 0.03614863826878979, "2": 0.005762579930228962, "1": 0.00035332844306645774}, "score": 4.381431536969237}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.768972938963572, "3": 0.13622067472234736, "1": 0.06804628116126965, "4": 0.021606292225013334, "5": 0.00467919122105911}, "score": 2.125484109156338}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6676565863010336, "1": 0.32484413379978777, "3": 0.007122699372905889, "4": 0.00024984183507890365, "5": 0}, "score": 1.6827380398776846}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7671995361609237, "5": 0.18319852098512426, "3": 0.04620142209920993, "2": 0.003204241109353979, "1": 0.00011636788067073865}, "score": 4.1302499215262785}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5767760304270293, "4": 0.4191963135610571, "3": 0.0038303733504701214, "2": 0.00013639083594034834, "1": 0}, "score": 4.572707748624973}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.980757384969849, "4": 0.0191532991274087, "3": 7.90104054194934e-05, "2": 6.798850528483292e-06, "1": 2.123346873975757e-06}, "score": 4.9806597633693235}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6468786694272183, "4": 0.3449499655015589, "3": 0.00745794329872338, "2": 0.0006240535350035245, "1": 8.186974903411507e-05}, "score": 4.637931793335578}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7383506881885599, "5": 0.19095833807310228, "3": 0.06375037580376226, "2": 0.006708830736758128, "1": 0.00012333787713963927}, "score": 4.113432586582711}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5156942128085101, "3": 0.4244299519165105, "4": 0.05783281100025488, "1": 0.0014075843088901681, "5": 0.0006314877592323463}, "score": 2.54058458938781}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9527973178156045, "4": 0.0464209923836736, "3": 0.0007492314576162469, "2": 1.513192208846049e-05, "1": 0}, "score": 4.952034317861226}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7952142530060798, "4": 0.2025319352361039, "3": 0.0021815193399571577, "2": 5.2237182929274926e-05, "1": 1.2331741621907436e-05}, "score": 4.792897388013068}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9956281176231897, "4": 0.004364123114589952, "3": 7.407733765860063e-06, "2": 1.1913804191991375e-07, "1": 0}, "score": 4.995620702986046}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.49498055500659316, "2": 0.2522141123596504, "4": 0.21618654710915933, "5": 0.03347601053863176, "1": 0.0030032372162815046}, "score": 3.0249214588789988}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.42500028052462363, "3": 0.206437205998348, "4": 0.17644278843487185, "5": 0.17109609863665, "1": 0.020678191185900904}, "score": 3.05229638782596}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9974667890079527, "4": 0.0024482166926749387, "3": 6.54629646779535e-05, "2": 2.725420036207936e-06, "1": 0}, "score": 4.99741263763487}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8966185394237031, "4": 0.06372969216291616, "3": 0.02884975437295425, "2": 0.0072537645253548215, "1": 0.0034314135122448203}, "score": 4.8430655158683}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5319690329900513, "4": 0.24558277979709117, "3": 0.13484498763726116, "2": 0.05178923343838791, "1": 0.035265222463676825}, "score": 4.18785299422712}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5748621534820784, "3": 0.38947007339972445, "2": 0.02479074948578911, "5": 0.01076223964996849, "1": 0.00011036273791273391}, "score": 3.571377684020859}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7407024028072126, "3": 0.22047453021411062, "4": 0.022016555189562328, "1": 0.01414274510221283, "5": 0.0026604420121820018}, "score": 2.258347080447576}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9111881333822294, "4": 0.08782215283256804, "3": 0.0008174185444285472, "1": 9.996254421404983e-05, "2": 6.117566978644573e-05}, "score": 4.909958628298365}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9313372988038925, "4": 0.06774746749964636, "3": 0.0008893737451996248, "2": 1.9384612048802247e-05, "1": 3.970414740824956e-06}, "score": 4.930399575171037}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8978596900932346, "4": 0.10164362053516916, "3": 0.00045236544416778484, "2": 2.2162275862106892e-05, "1": 1.1852781407412159e-05}, "score": 4.897336692280569}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9480621403338307, "4": 0.050169610706691764, "3": 0.0016041889134625611, "2": 0.00012112118313926292, "1": 2.9383419655479048e-05}, "score": 4.9461403841473786}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7227514296628403, "4": 0.2684142722500815, "3": 0.008657900692983538, "2": 0.0001498168514825647, "1": 1.646049977788193e-05}, "score": 4.713751736965709}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9828288085851704, "4": 0.01703293255121981, "3": 0.00012906673006809604, "2": 2.3795956016291444e-06, "1": 0}, "score": 4.98270167735636}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.995193806289789, "4": 0.0047478233882952275, "3": 5.103672940686449e-05, "2": 1.504203553758088e-06, "1": 0}, "score": 4.995145562243823}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7299716800823226, "4": 0.20308584653456702, "3": 0.05041927684233762, "2": 0.013194463093532982, "1": 0.0031310915412513397}, "score": 4.643897463551121}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"5": 0.3095118809604269, "4": 0.2699507618857763, "2": 0.20235390694277094, "3": 0.13500776279658092, "1": 0.08301499706312754}, "score": 3.5206742900721975}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9829989136233763, "4": 0.01648813908336253, "3": 0.0004494057515537473, "2": 3.7999559135597136e-05, "1": 1.20857558655668e-05}, "score": 4.982450471562227}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5002945019773456, "5": 0.4237514069741542, "3": 0.06839829373907041, "2": 0.007203203653837531, "1": 0.000344107654644984}, "score": 4.339917267501727}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964237993919971, "4": 0.0035369998894998534, "3": 3.443031953301727e-05, "2": 1.634594167535924e-06, "1": 1.4795049786829218e-06}, "score": 4.996383311678697}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997599404449249, "4": 0.0023686455146895535, "3": 3.0373622716446508e-05, "2": 1.116968766745521e-06, "1": 3.167214994030738e-07}, "score": 4.997565989100191}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4769395145559589, "3": 0.34311016590089677, "1": 0.08091221317463738, "4": 0.07926539709383042, "5": 0.01857652671186531}, "score": 2.4770289407503983}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8161633665098491, "1": 0.1777625158712273, "3": 0.006013345678814163, "4": 3.96320667885871e-05, "5": 0}, "score": 1.828326464784377}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5907612024483222, "4": 0.4023764845102419, "3": 0.006766840447741766, "2": 7.343594707956374e-05, "1": 0}, "score": 4.583860356430769}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5254798152311909, "4": 0.44432600521361654, "3": 0.02844867193975695, "2": 0.0016135896267221892, "1": 0.00011665648119535016}, "score": 4.493461525561186}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5423155778645138, "4": 0.43592325577104185, "3": 0.02062743485816445, "2": 0.001007984990319376, "1": 9.201674376767837e-05}, "score": 4.519413642498242}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"1": 0.792790816231322, "2": 0.20715926197857723, "3": 4.6211170656551914e-05, "5": 7.854218248386397e-08, "4": 0}, "score": 1.2072527512466256}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6233236329718194, "3": 0.21393958861605786, "4": 0.08036135319627824, "1": 0.05428112599683845, "5": 0.028059450150264852}, "score": 2.4045736184764115}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9967324510955664, "4": 0.00318434710994306, "3": 5.0067322909905094e-05, "1": 4.6606669395141775e-06, "2": 0}, "score": 4.996696781521281}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"1": 0.9153966320322755, "2": 0.07406942869710374, "3": 0.007353347700473062, "5": 0.0025571582388911563, "4": 0.0006152954493920581}, "score": 1.1008514641190916}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"1": 0.9445379970931091, "2": 0.05468076372780445, "3": 0.0007439475670572759, "5": 2.5783933308510378e-05, "4": 7.700887315226988e-06}, "score": 1.0562951115608454}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3928500704617027, "3": 0.3914058295629038, "2": 0.13353235112163325, "5": 0.08102761957691064, "1": 0.001129886605961267}, "score": 3.419135920333752}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9486062252445955, "4": 0.04610683386243225, "3": 0.0041985770865979105, "2": 0.0009676205900004702, "1": 8.892795592766595e-05}, "score": 4.942235600581249}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.930225117778245, "4": 0.06862082629626175, "3": 0.0011069630547745123, "2": 2.408349034850471e-05, "1": 0}, "score": 4.929091365559402}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7681143374711293, "4": 0.19670335446919, "3": 0.03190283186289292, "2": 0.0029818182903277677, "1": 0.00021905504778160125}, "score": 4.7296480563072905}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.998314578620528, "4": 0.0016463415421228635, "3": 2.446199180276323e-05, "2": 2.5773907705845542e-06, "1": 0}, "score": 4.9982969817968455}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8846234064257421, "2": 0.11517453563378213, "3": 0.00019958506929820659, "5": 9.866139586603511e-07, "4": 7.75779893030042e-07}, "score": 1.1155800616849054}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5404904883121975, "4": 0.4436635384972229, "3": 0.015324904941769696, "2": 0.0004937112627581884, "1": 2.343120211740361e-05}, "score": 4.5241099247808805}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7517982617291878, "5": 0.17298698820514452, "3": 0.07445031416865314, "2": 0.000740466251930932, "1": 0}, "score": 4.097058067980071}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.45848339677108146, "3": 0.3230519282840858, "4": 0.15439623907664723, "1": 0.042561737928341725, "5": 0.021372504917040954}, "score": 2.6534878767737107}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8366075963407682, "4": 0.16135993308986, "3": 0.002001104501713154, "2": 2.5959887492936654e-05, "1": 0}, "score": 4.834559083840835}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6536830029511659, "1": 0.3318819983172432, "3": 0.01402074023874837, "4": 0.00037149045027184415, "5": 4.231939780821474e-05}, "score": 1.6830085387989147}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9750722969649867, "4": 0.02482945820195418, "3": 9.268137708675173e-05, "2": 7.709479310266571e-07, "1": 0}, "score": 4.97498274630469}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7190760751310754, "4": 0.27392139316854075, "3": 0.006913644197310746, "2": 7.214597939053789e-05, "1": 0}, "score": 4.712030059443087}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986549588797473, "4": 0.0013321794416285059, "3": 1.1709618030182821e-05, "2": 2.9626781834308923e-07, "1": 0}, "score": 4.998643511357982}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8186301536240007, "4": 0.15820487637635938, "3": 0.019115525895936486, "2": 0.003436893389743804, "1": 0.0005966004091983117}, "score": 4.790863654237291}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7130729140868522, "1": 0.21957939575521881, "3": 0.06097872781326588, "4": 0.0040750388442640775, "5": 0.0017467956965064916}, "score": 1.8547103048042342}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.653362482728365, "3": 0.26094464037499504, "4": 0.050154291246982494, "1": 0.02820100114704432, "5": 0.007286023901002748}, "score": 2.354928593756747}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5951126283531633, "4": 0.39495952013634444, "3": 0.009699386916061821, "2": 0.00013117896789276574, "1": 0}, "score": 4.585207815810332}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6814427890082688, "4": 0.20640102072786812, "3": 0.10061177303327423, "2": 0.008285035029912468, "1": 0.0030550528102819044}, "score": 4.555209233048453}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8758945605141789, "4": 0.11888701389064911, "3": 0.004918727599072679, "2": 0.00022069321241001714, "1": 4.9629507095398857e-05}, "score": 4.870411126536593}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8561418790680638, "1": 0.12664273081960672, "3": 0.016985300252776312, "4": 0.0001777108085409114, "5": 4.768126521546463e-05}, "score": 1.8908405220380524}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7964471377561776, "4": 0.1776283558235354, "3": 0.019433886691654387, "2": 0.005800225400672297, "1": 0.0006105258029697208}, "score": 4.76364221383151}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8895432057332051, "4": 0.09517713924525613, "3": 0.011582250291792254, "2": 0.002766960095104475, "1": 0.000781049523315377}, "score": 4.870213892382589}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9769938233662737, "4": 0.022471640207737627, "3": 0.00046472705649217407, "2": 3.352259060448786e-05, "1": 0}, "score": 4.976497485076902}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7628486950873952, "4": 0.2300162546879097, "3": 0.0068690669301475216, "2": 0.0001999556432027886, "1": 3.357761275891355e-05}, "score": 4.755503500150297}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9005384831189667, "1": 0.05142653472196282, "3": 0.045642097388215605, "4": 0.0022823414755978617, "5": 0.00010309104790032896}, "score": 1.999089511975968}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7084940130950135, "4": 0.2864672098966008, "3": 0.00482574911136857, "2": 0.00012141307297557172, "1": 0}, "score": 4.703489887939993}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5759336015602141, "4": 0.4085827397107635, "3": 0.01519463308489036, "2": 0.00026533244733056215, "1": 0}, "score": 4.560221577020739}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8733516393735792, "4": 0.12522855139860634, "3": 0.0013946253027046864, "2": 2.0082053548865576e-05, "1": 3.172203820844085e-06}, "score": 4.871909015847014}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5947064241444222, "5": 0.3685762385048438, "3": 0.03462953667336267, "2": 0.0019328010634728117, "1": 0.00013551692739807562}, "score": 4.329680971993365}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6796921662508449, "5": 0.2593466746835275, "3": 0.054133557441611066, "2": 0.0065672723507826675, "1": 0.00022584333658910743}, "score": 4.191407643402447}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9171086312513655, "4": 0.0807097575189413, "3": 0.0019938686145690348, "2": 9.793603465520421e-05, "1": 0}, "score": 4.915001063684141}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8969873675691887, "4": 0.09864467763213945, "3": 0.004143769906747549, "2": 0.00013933603839192082, "1": 0}, "score": 4.892640665122709}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9544199044089368, "4": 0.044547631119643036, "3": 0.000985387788855398, "2": 3.406697902069067e-05, "1": 1.0424403605722777e-05}, "score": 4.953337574114795}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.2799527052223369, "2": 0.2762086833140106, "3": 0.23400385251983105, "1": 0.13076745315661462, "5": 0.07903419279222447}, "score": 2.900274198959597}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6477387159952682, "1": 0.35132073423610627, "3": 0.000936818029527237, "4": 2.447121798794802e-06, "5": 1.1295852816422062e-06}, "score": 1.6496243124734136}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9369106020438037, "4": 0.05978911248916776, "3": 0.0024291749646501294, "2": 0.0006982865565362149, "1": 0.00016893796186352662}, "score": 4.932581664077895}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.47731401133296775, "4": 0.22436255196188476, "3": 0.15072615977405202, "2": 0.1397090127175895, "1": 0.007862728463632443}, "score": 4.023582242923097}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9489205277780383, "4": 0.050654748573340916, "3": 0.0003934321232119094, "2": 2.8537230210842588e-05, "1": 2.6349561960475504e-06}, "score": 4.948462229514354}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5822233744430432, "5": 0.37518175140993776, "3": 0.038794476528484036, "2": 0.0036952886816068045, "1": 0.00010454593643894254}, "score": 4.32868324475775}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8435643758426764, "2": 0.15627664139061478, "3": 0.00014467264333641445, "4": 6.223544818693046e-07, "5": 0}, "score": 1.156569996834665}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9794763929607745, "4": 0.019544731839303567, "3": 0.0008523746480744297, "2": 8.38635067816679e-05, "1": 3.169131149438262e-05}, "score": 4.978371926363093}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9765131922773779, "4": 0.023271314830957606, "3": 0.00019607976837954206, "2": 4.6998827329297865e-06, "1": 0}, "score": 4.976322077605117}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987814570271567, "4": 0.0011564126601307568, "3": 4.7707067758904874e-05, "1": 8.445785486592173e-06, "2": 4.191910338042572e-06}, "score": 4.9987018120134135}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6666827389325114, "1": 0.2884882562793313, "3": 0.03940165336421255, "4": 0.004108336816057277, "5": 0.0013126950040766607}, "score": 1.7630666584043773}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9008358494876565, "3": 0.052055475111038106, "1": 0.04619466332557317, "4": 0.0008088100213027635, "5": 0.00010031743997457646}, "score": 2.0077794221474714}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9926558130141827, "4": 0.007274824426719986, "3": 6.179469738584146e-05, "2": 1.8653068268163032e-06, "1": 0}, "score": 4.992595948036016}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9650802263353083, "4": 0.034716999946296775, "3": 0.00018108301236265703, "2": 2.9408026607930615e-06, "1": 0}, "score": 4.964911353712268}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9323452061595497, "4": 0.06697033626124434, "3": 0.0006111486736476528, "2": 5.2095447138520066e-05, "1": 0}, "score": 4.931649630102315}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.711401863491821, "5": 0.20332499896899953, "3": 0.07332856105046691, "2": 0.011424519499760815, "1": 0.0004110632756356748}, "score": 4.105925754333405}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"4": 0.46351178879789867, "3": 0.3297459069655118, "2": 0.13694509498708546, "5": 0.06592050055757076, "1": 0.003835944079049795}, "score": 3.450754181587574}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7891112474816147, "3": 0.1601547730098787, "1": 0.03422395984302235, "4": 0.015147935908077918, "5": 0.0013329047442717915}, "score": 2.160230074571278}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9700530541310117, "4": 0.029111761826161656, "3": 0.000729811409754604, "2": 3.549609029795143e-05, "1": 0}, "score": 4.9693199832699335}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5449608291615289, "3": 0.29686196871837695, "5": 0.1315228076760882, "2": 0.02610100394676418, "1": 0.0005084180071600317}, "score": 3.7809237246370824}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7811154396609856, "4": 0.2144287207575358, "3": 0.0043480056946800915, "2": 8.610164853206546e-05, "1": 1.6526837223165525e-05}, "score": 4.77654969241015}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7781057177793426, "5": 0.1451149053057651, "3": 0.07251369778514166, "2": 0.004086007283655774, "1": 0.000125591372069986}, "score": 4.06405588300962}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.943357058477238, "4": 0.05497430416061242, "3": 0.0015198692006965116, "2": 8.556416462740911e-05, "1": 0}, "score": 4.941725581767967}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9642366817685731, "4": 0.035220196384241294, "3": 0.0004753876412049975, "2": 5.515027052568678e-06, "1": 0}, "score": 4.963810231554513}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9857918501400541, "4": 0.014020752857420275, "3": 0.0001725992715112971, "2": 4.330844501405907e-06, "1": 0}, "score": 4.985620905561703}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9819026146135689, "4": 0.0178170092876536, "3": 0.00025203262866629693, "2": 8.12315445134116e-06, "1": 0}, "score": 4.9816541850334914}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"4": 0.48490717408593537, "5": 0.4223244590752294, "3": 0.08824771286927821, "2": 0.00420057020421261, "1": 0}, "score": 4.325779882649038}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.8545824858124033, "2": 0.12817496940621706, "3": 0.014013688178428782, "5": 0.00201688507463455, "4": 0.0011463056338987313}, "score": 1.1677198164350668}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8504439259564418, "4": 0.1422161778215582, "3": 0.006623131398174801, "2": 0.00035772429283971495, "1": 0}, "score": 4.843408163687514}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5305963586524657, "4": 0.4351765230905188, "3": 0.03321309676411399, "2": 0.0008958330414677146, "1": 0}, "score": 4.4956501759321625}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7659998921790316, "4": 0.2267558933061107, "3": 0.007107611691253618, "2": 0.00012179503098881841, "1": 8.549583411532645e-06}, "score": 4.758627789326978}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7161570804354989, "3": 0.2653425357320662, "4": 0.014611125790909674, "1": 0.0031447307643944636, "5": 0.0007064368811704341}, "score": 2.2935505486496344}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.34288731962556235, "4": 0.3255407607939842, "3": 0.15405433717542782, "2": 0.12660904833317796, "1": 0.050757169505181214}, "score": 3.783310578167798}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5169379867123997, "4": 0.4561613702235743, "3": 0.02569037938913363, "2": 0.0011267367003648867, "1": 6.161624528711251e-05}, "score": 4.488819995589245}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.4749210354143731, "3": 0.3210596973788974, "5": 0.18319093672335077, "2": 0.0199747001241637, "1": 0.000792009635649294}, "score": 3.81979470580856}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5153946299536757, "5": 0.42253770228022725, "3": 0.05891525049632125, "2": 0.0029299192970542102, "1": 0.00017257148526543653}, "score": 4.357262735607488}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.47760876256161117, "3": 0.3179746234048112, "2": 0.17123893792236494, "5": 0.031964975219573186, "1": 0.0011459778373645749}, "score": 3.368032375647839}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5192050640897963, "2": 0.39929287851325185, "4": 0.04536184254078271, "5": 0.018854561593761976, "1": 0.01712850918352416}, "score": 2.6494659845030237}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5093833003266348, "4": 0.39432950976647413, "2": 0.0778160632967272, "5": 0.017988133292899146, "1": 0.00047765893751134547}, "score": 3.351536270408486}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9856921107950716, "4": 0.014197008579259627, "3": 0.00010723209076220836, "2": 1.8464863408507508e-06, "1": 0}, "score": 4.98558296179999}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.4607240063388946, "4": 0.34641822191384514, "2": 0.11440251683185379, "5": 0.07236859821421003, "1": 0.006081085881621807}, "score": 3.364592760827657}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"5": 0.994952769688418, "4": 0.004917660842750346, "3": 0.00011478967696840814, "2": 9.161973086662003e-06, "1": 0}, "score": 4.9948252448132155}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9930979177424246, "4": 0.006692960343179773, "3": 0.00018262658663342632, "2": 9.44613400653837e-06, "1": 0}, "score": 4.992913327259477}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9874940890469652, "4": 0.012283971456974501, "3": 0.00017218208627197977, "2": 2.652022504014507e-06, "1": 0}, "score": 4.987363113037515}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999347227208922, "4": 0.0006443456192273614, "3": 4.470452160411899e-06, "1": 2.1690573038143164e-07, "2": 0}, "score": 4.999345843407106}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9425110524418269, "4": 0.05575335450270335, "3": 0.0016397940898470928, "2": 6.308049176536092e-05, "1": 1.6797457874477837e-05}, "score": 4.940709682048707}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7866760041648144, "3": 0.12788041622328603, "5": 0.07709892048518846, "2": 0.008270982285789721, "1": 6.644380534165336e-05}, "score": 3.932476719876011}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.983457234566308, "4": 0.015767380473759873, "3": 0.00076491457273554, "2": 7.97260713567072e-06, "1": 1.213213419439542e-06}, "score": 4.98267399744928}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9828747559231307, "4": 0.01700139975136408, "3": 0.00010936036805701199, "2": 1.5369770887385771e-06, "1": 0}, "score": 4.982775045570109}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9590851112852435, "4": 0.04052593254610963, "3": 0.0003832548827174867, "2": 3.410277130601359e-06, "1": 0}, "score": 4.95869723223206}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9939665888673432, "4": 0.005817023931498508, "3": 0.00019693733032793607, "2": 1.1172155402275177e-05, "1": 6.701735736296806e-06}, "score": 4.993728768115361}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6898158369408831, "1": 0.3080155531633203, "3": 0.0021647573550458124, "4": 2.829000751509364e-06, "5": 1.0507619398043762e-06}, "score": 1.6941580228046598}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.992113778704184, "4": 0.007779626108345033, "3": 9.492656170436675e-05, "2": 3.550010488408665e-06, "1": 0}, "score": 4.992019805948655}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.993216440921434, "4": 0.006710375958402247, "3": 6.427971183951009e-05, "2": 1.387862172724492e-06, "1": 0}, "score": 4.993156849601387}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.977188661221889, "4": 0.0217547468343936, "3": 0.0009323051338747689, "2": 8.265262283169279e-05, "1": 3.7636715799107124e-05}, "score": 4.97598204215507}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.987278510034884, "4": 0.012426793143846588, "3": 0.0002780220863853777, "2": 1.095127138743801e-05, "1": 4.249088791565197e-06}, "score": 4.986967293298961}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6127211748186895, "1": 0.3810623572212818, "3": 0.006065914286301303, "4": 8.381907089962243e-05, "5": 4.377082755677273e-05}, "score": 1.6252939030228852}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.378266993759877, "4": 0.29180797876539, "3": 0.2119753891423813, "2": 0.11471497561847785, "1": 0.0031625497304773806}, "score": 3.9273687665341748}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.935668249150151, "4": 0.06226356224359377, "3": 0.0020307136418449222, "2": 2.5509184351467135e-05, "1": 0}, "score": 4.9335976883642045}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9752366719299593, "4": 0.024238485478327833, "3": 0.000493163004815242, "2": 1.895547026035206e-05, "1": 7.27286688198552e-06}, "score": 4.9746890926576555}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.760158306018414, "1": 0.17118207891304202, "3": 0.06359430224449211, "4": 0.00378982664893935, "5": 0.0012697280948211892}, "score": 1.9038005069893877}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7608682983703774, "3": 0.14314028723527328, "4": 0.05330968270768574, "1": 0.036662102018938096, "5": 0.005853982969055414}, "score": 2.2306977138535635}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996670928458881, "4": 0.0003287762926591255, "3": 2.0389165380406298e-06, "1": 1.2321069248032075e-07, "2": 0}, "score": 4.999666652375222}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8931351372924364, "4": 0.10449751372140226, "3": 0.002284728682952328, "2": 7.381452721483168e-05, "1": 4.657121521175984e-06}, "score": 4.890692503365928}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982075457683247, "4": 0.0017855842613932777, "3": 6.137684525751664e-06, "2": 1.481545279668046e-07, "1": 0}, "score": 4.998201694855524}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.844895920683386, "4": 0.14523194411442716, "3": 0.009180386250656156, "2": 0.0005998346044494738, "1": 7.059219302231576e-05}, "score": 4.834321878184385}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8927519805748383, "4": 0.10323400235678, "3": 0.0031593164123205693, "2": 0.0006909692057160444, "1": 0.00014025603278174082}, "score": 4.887810799381971}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9925869849441915, "4": 0.007289891620095493, "3": 9.039189063092824e-05, "2": 1.670250249112425e-05, "1": 0}, "score": 4.992479096538288}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9995731098635341, "4": 0.000420034124994734, "3": 2.28785239317562e-06, "1": 0, "2": 0}, "score": 4.999575388230525}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981002976230805, "4": 0.0018566128495701726, "3": 2.1901137102525397e-05, "1": 1.292178505494407e-06, "2": 0}, "score": 4.998094378247549}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987176125624164, "4": 0.0012554477463822312, "3": 1.4730608766503098e-05, "1": 1.5432515057071741e-06, "2": 0}, "score": 4.998708904259453}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5377278509822965, "2": 0.44212802036801846, "3": 0.019092688848703094, "4": 0.0005687093857040687, "5": 0.00041781679959185133}, "score": 1.483722193577477}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6607491578731673, "5": 0.31888667184222463, "3": 0.01923409487562898, "2": 0.0010433941229366513, "1": 0}, "score": 4.297591584341968}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9285994181360011, "4": 0.07070595362049042, "3": 0.0005931691233795417, "2": 5.246572283387794e-05, "1": 0}, "score": 4.927946780832256}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8034780678063059, "3": 0.11794925374786173, "5": 0.061583863433982367, "2": 0.01675123989279859, "1": 0.0001755081635826045}, "score": 3.9095999945566637}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5658267177716836, "3": 0.2630726366382762, "2": 0.10254530274983817, "5": 0.06328728746106656, "1": 0.005184414839925846}, "score": 3.579535632936957}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8206835322833671, "1": 0.15193370569787715, "3": 0.02678318536832584, "4": 0.0004719988541641459, "5": 0.00011980429757657598}, "score": 1.8761519275386775}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5652212452339637, "1": 0.22132778195875688, "3": 0.16230595724344435, "4": 0.03727206352897207, "5": 0.013549270103603914}, "score": 2.0561882997908336}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9070330597248605, "4": 0.09041359822983416, "3": 0.002394962753535252, "2": 0.0001433853208645071, "1": 1.1139034465246815e-05}, "score": 4.9043213953277}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8956010427096573, "4": 0.10036067818337717, "3": 0.0037244488419152584, "2": 0.00019536967985930826, "1": 0}, "score": 4.89159147295566}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6809292156579971, "4": 0.25808951419268733, "3": 0.05540095760995724, "2": 0.004959035563472743, "1": 0.00054186015847972}, "score": 4.614033371021763}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6297404554235259, "2": 0.31798915517714926, "4": 0.05109955450051563, "5": 0.0006963988509898633, "1": 0.0004737247979130302}, "score": 2.7335555579209356}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.710480569117364, "5": 0.16283445626313178, "3": 0.11975054398849629, "2": 0.00625749083063131, "1": 0}, "score": 4.030589637956784}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9601973046122454, "4": 0.03968230137045279, "3": 0.00011434835765940262, "2": 1.012002010946186e-06, "1": 0}, "score": 4.960085764993602}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9721133646734557, "4": 0.027775001207002745, "3": 0.00010984810610715817, "2": 1.03037370617234e-06, "1": 0}, "score": 4.9720021903034075}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5707716852432988, "5": 0.41880829231612793, "3": 0.010324057784888156, "2": 9.069185558216314e-05, "1": 2.802871865974687e-06}, "score": 4.408295450664939}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"4": 0.692891034173692, "5": 0.23926635297313628, "3": 0.06290493251423387, "2": 0.004731857724460817, "1": 0.00011389620577071653}, "score": 4.166571328696709}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9311480051106809, "3": 0.06646860819449875, "1": 0.001917619894904248, "4": 0.0004532025056638102, "5": 1.1157819560318763e-05}, "score": 2.0654909588809796}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.712876746193325, "4": 0.2599960345015595, "2": 0.019213104629144807, "5": 0.007867615094701652, "1": 3.6517827206352546e-05}, "score": 3.256447684205119}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9042012099303894, "4": 0.09473068576192249, "3": 0.0010282304129019184, "2": 1.5150909421328962e-05, "1": 0}, "score": 4.903165006633886}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.7193237244221174, "2": 0.17555845756507474, "4": 0.09694299050600828, "5": 0.004945885303010807, "1": 0.0031515590880624293}, "score": 2.9249673791128457}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"3": 0.44504082030520375, "4": 0.3952586572130913, "2": 0.12285407623246083, "5": 0.03619430836493255, "1": 0.0006442660474570448}, "score": 3.343507369649554}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8906138721778298, "3": 0.0971772935751128, "1": 0.0073827653639049326, "4": 0.004672015573933377, "5": 0.00013203850148380783}, "score": 2.099536866148497}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5872489755098629, "5": 0.3984134873717374, "3": 0.013826060854706938, "2": 0.00045058356690239786, "1": 0}, "score": 4.383709624497046}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994047299835382, "4": 0.0005913682725639312, "3": 3.4116790425752174e-06, "2": 1.5925645652307254e-07, "1": 0}, "score": 4.999401330401937}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7438170313489171, "4": 0.23223188550564475, "3": 0.022784645793210653, "2": 0.0011109679684704434, "1": 3.7149137639647875e-05}, "score": 4.718712169189674}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5289572834532754, "1": 0.46970221978357873, "3": 0.0013190506574934906, "4": 1.2228356499522232e-05, "5": 7.80862239153272e-06}, "score": 1.5316640535093726}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5160780062619976, "5": 0.4711364142696613, "3": 0.01218400808273762, "2": 0.0005848769937123686, "1": 1.3006725345561711e-05}, "score": 4.457745320035565}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9566311452372072, "4": 0.04276603783144872, "3": 0.000578215743664825, "2": 1.1123851179591086e-05, "1": 0}, "score": 4.95604356671204}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9668111590177353, "4": 0.03290580806044352, "3": 0.0002737558245951522, "2": 6.652379152411761e-06, "1": 1.8287461314884264e-06}, "score": 4.96651938151875}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.984335870855729, "4": 0.01560403101044871, "3": 5.557878468154973e-05, "2": 1.7529227856007176e-06, "1": 0}, "score": 4.984279509162252}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9150654190800518, "4": 0.07471763029737669, "3": 0.007722091746708821, "2": 0.0013964186877739573, "1": 0.0008028430641835843}, "score": 4.902408710184561}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7641620232370226, "4": 0.22082414901958627, "3": 0.013087462082759922, "2": 0.0014995743167244726, "1": 0.00034889483972745303}, "score": 4.747086923461288}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7964901550277588, "4": 0.2014872248204658, "3": 0.001965869574494022, "2": 4.108134222482e-05, "1": 0}, "score": 4.794454571264234}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"2": 0.29985273745337593, "4": 0.2726511063096291, "3": 0.2166896572511392, "5": 0.12999809272244342, "1": 0.08051268736159166}, "score": 3.071790409358973}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4847277916193264, "4": 0.45763037600036466, "3": 0.04819305767201874, "2": 0.008528429920608543, "1": 0.0008438894967174813}, "score": 4.416978085796814}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8593164769458507, "1": 0.13619565328269048, "3": 0.004438530170610555, "4": 3.233630387261786e-05, "5": 1.2574985437887702e-05}, "score": 1.868344691441257}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.8357058682848991, "3": 0.15484737880855406, "4": 0.004942772847960572, "1": 0.004233329414054617, "5": 0.00025588280788447864}, "score": 2.1612696251175536}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.887784789081987, "4": 0.10907090539835271, "3": 0.0031108623757225068, "2": 2.4543978714947538e-05, "1": 0}, "score": 4.884632711241493}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997917131647154, "4": 0.00019919745280878986, "3": 3.491971784708308e-06, "1": 4.899717992739939e-07, "2": 0}, "score": 4.99979185765335}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.4925633486210327, "4": 0.4085425534888763, "3": 0.07736212184657662, "2": 0.017005779876075877, "1": 0.0044047899728186755}, "score": 4.3680199770088}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9970027921226475, "4": 0.002962155696102305, "3": 2.9357955271043468e-05, "2": 6.598290834056104e-07, "1": 0}, "score": 4.996977133687796}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9991421483652828, "4": 0.0008487490486293318, "3": 7.168658642524843e-06, "1": 3.4816302647016224e-07, "2": 0}, "score": 4.9991355196111185}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9804515481676678, "4": 0.019257717297794196, "3": 0.0002815908294737231, "2": 5.06930414138894e-06, "1": 0}, "score": 4.980163812310252}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9873046574651865, "4": 0.012400884230527468, "3": 0.0002819454346211018, "2": 8.074020471923642e-06, "1": 0}, "score": 4.9870109451823605}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9949021389246995, "4": 0.005051762937905316, "3": 4.133801588101389e-05, "2": 1.2546850161869866e-06, "1": 0}, "score": 4.9948617789635765}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5346233118895114, "3": 0.3489027321731222, "4": 0.10878989779718959, "5": 0.004465909008696537, "1": 0.0031982407051542303}, "score": 2.576693495148398}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5877801885332994, "5": 0.31688289175502116, "3": 0.09016447288098278, "2": 0.004876136858383153, "1": 0.0002696461537886476}, "score": 4.216162970426121}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.782294852710663, "4": 0.21563741845934162, "3": 0.00204246125665497, "2": 1.055910539138213e-05, "1": 0}, "score": 4.780242749418697}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7071997861842674, "5": 0.12286079653422931, "3": 0.11870343966324122, "2": 0.049747354135392656, "1": 0.001439252208398919}, "score": 3.9003399716323917}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6642749060837314, "5": 0.2548514124325866, "3": 0.07612125116078718, "2": 0.004518076178352535, "1": 0.00018958141407100125}, "score": 4.169132837211815}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9464798287218994, "3": 0.04975471728866461, "1": 0.0035176806950131486, "4": 0.00024009521119012703, "5": 7.202481057361521e-06}, "score": 2.046738856688305}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9988590054298703, "4": 0.001134053723021756, "3": 5.814673043335203e-06, "1": 3.032646440298934e-07, "2": 0}, "score": 4.998853102928523}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9981554094521251, "4": 0.00183521727222972, "3": 7.364720194601104e-06, "1": 1.5393321460369482e-07, "2": 0}, "score": 4.998149434122421}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948237959532116, "4": 0.005109992206062883, "3": 5.501096659343268e-05, "1": 3.487710689087443e-06, "2": 0}, "score": 4.9947659946472545}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9826279231842293, "4": 0.017146949378451373, "3": 0.00020811390665655894, "2": 6.4273129483722365e-06, "1": 0}, "score": 4.98241735473568}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9319881397198461, "1": 0.0562709141437895, "3": 0.011598262228268864, "4": 0.00012791865549604823, "5": 1.2570584963112459e-05}, "score": 1.9556207997527664}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5035642843490443, "5": 0.3959969103122053, "3": 0.09586891398055541, "2": 0.004463643134888737, "1": 9.634375316757541e-05}, "score": 4.290914560156944}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8020692726262633, "5": 0.12715268125481602, "3": 0.06808148380050405, "2": 0.0025919390899912264, "1": 7.907118778908675e-05}, "score": 4.053651476615673}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8030541039760146, "4": 0.19238590543668702, "3": 0.004425662474396077, "2": 0.00011814380370673556, "1": 1.1267884029779055e-05}, "score": 4.798362275330496}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6018526085176782, "5": 0.36950359842796066, "3": 0.025962829460501203, "2": 0.002545913892800394, "1": 0.00011424743262454977}, "score": 4.338113232406206}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.46552633978954006, "5": 0.24871057698147817, "3": 0.21213576676834442, "2": 0.06954028875866392, "1": 0.003912778279086745}, "score": 3.885735987420297}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9056585684343176, "3": 0.058926563310411954, "1": 0.03468087141772857, "4": 0.0006224057168325522, "5": 0.00011049160640801976}, "score": 2.025822006537238}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9133985460795704, "4": 0.08462744127603067, "3": 0.0019245405789730984, "2": 2.4340766001708235e-05, "1": 0}, "score": 4.911448229846969}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6771694107022058, "4": 0.3137876172831104, "3": 0.008396069494179013, "2": 0.0004902596545333155, "1": 8.540140545386153e-05}, "score": 4.667584177354412}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7148142215855922, "4": 0.21940555772272838, "3": 0.039113394512600576, "2": 0.013722922076836798, "1": 0.01261502645228393}, "score": 4.610610719781027}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5172388080499758, "2": 0.4728116843988866, "3": 0.00966446038256516, "4": 0.0002133759339123419, "5": 5.4895180510294404e-05}, "score": 1.493008584426504}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6008442076084985, "5": 0.3797327170237989, "3": 0.018617499634714853, "2": 0.0007866891252292582, "1": 1.3819609447132654e-05}, "score": 4.3595022019073335}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8198421559474148, "5": 0.11374627146704387, "3": 0.06613056060593198, "2": 0.00027256402972351644, "1": 0}, "score": 4.047070980454949}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8025973202429184, "5": 0.17844061895984023, "3": 0.018005734292745604, "2": 0.0009229196318540334, "1": 1.9209223570232255e-05}, "score": 4.158533668538068}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.3399241413302707, "4": 0.3218558192562257, "2": 0.28061894431411627, "5": 0.03527638567307127, "1": 0.022199620163556148}, "score": 3.06739883683195}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.46879312777959486, "3": 0.22913312785456025, "4": 0.20590824953813175, "2": 0.08285935720219584, "1": 0.013239289408055606}, "score": 4.034225705223862}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.893857859765797, "3": 0.08788888788262286, "1": 0.016868606299070155, "4": 0.0012062571233025206, "5": 0.00017756967337689367}, "score": 2.0739655654470095}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6276929469881604, "4": 0.3473517929708794, "3": 0.02459495840336841, "2": 0.00033510705835969605, "1": 1.9242618987096666e-05}, "score": 4.602373631915021}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.46234440511730956, "4": 0.33896880380846167, "3": 0.14657326106384239, "2": 0.0436237522756412, "1": 0.008446226545623116}, "score": 4.2031938091973275}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.6030472663521332, "4": 0.21724757003684886, "2": 0.13273013131569755, "5": 0.04336382546819082, "1": 0.0035801234354068366}, "score": 3.164089943258703}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9964933979396053, "4": 0.003415662526309618, "3": 7.448446334739372e-05, "2": 5.825667341559472e-06, "1": 5.397865285783966e-06}, "score": 4.996396281230837}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5131709415094128, "1": 0.22147959846318604, "4": 0.18181201687514306, "3": 0.05503155670573101, "2": 0.028056274000281323}, "score": 3.737470004660143}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9082999986139062, "4": 0.08039939722715575, "3": 0.00891208551815503, "2": 0.0016875972622325203, "1": 0.0005158518222009867}, "score": 4.8946307320173545}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.996502756650948, "4": 0.003132732663155342, "3": 0.00018981834919235756, "1": 0.00013419923954801667, "2": 3.1442345209742744e-05}, "score": 4.995856469142568}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999259378495597, "4": 0.0007314464104473217, "3": 5.396542970779153e-06, "1": 6.707542576934981e-07, "2": 0}, "score": 4.999255075171505}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5936462356003102, "4": 0.39493657365482626, "3": 0.011107974557572614, "2": 0.0002465334189098542, "1": 0}, "score": 4.582081680696088}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5593322597628816, "5": 0.24703609979926805, "3": 0.1907611227312251, "2": 0.002746160567807725, "1": 7.158571607921621e-05}, "score": 4.050570567464983}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9795596608086719, "4": 0.020245176729458643, "3": 0.00017650329733159755, "2": 1.8301383369614849e-06, "1": 0}, "score": 4.979395979515267}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948469258753517, "4": 0.005114349820370697, "3": 3.643025307804178e-05, "1": 6.754893133679635e-07, "2": 6.045164226090248e-07}, "score": 4.9948082689022995}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9714893273195743, "4": 0.028182566540245823, "3": 0.00030904767652725545, "2": 4.6778030126427166e-06, "1": 0}, "score": 4.971184890317348}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9891918869461296, "1": 0.0069892250108926956, "3": 0.003801274020070866, "4": 1.6374488722235444e-05, "5": 7.198492657346925e-07}, "score": 1.99684695589583}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7401809615829106, "4": 0.25727492983082134, "3": 0.00248689508603104, "2": 4.8783227644087287e-05, "1": 0}, "score": 4.737602718233571}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9147877114218332, "4": 0.08485044862875239, "3": 0.00035715953473342075, "2": 2.8195465043683352e-06, "1": 0}, "score": 4.914426614421478}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8670760931677861, "4": 0.12928536318982808, "3": 0.003421415242186479, "2": 0.0001490025705729773, "1": 0}, "score": 4.8634154936812735}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8949129168948657, "4": 0.1030057569083851, "3": 0.0020139465988651115, "2": 5.2602705719992185e-05, "1": 8.83302959237746e-06}, "score": 4.892772572313262}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9996513670066106, "2": 0.00033154102511250786, "3": 1.914842852608351e-06, "5": 3.8618550500888383e-07, "4": 0}, "score": 1.0003369204362076}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6234807178511483, "2": 0.17573709133629453, "5": 0.11824450760545113, "3": 0.0675711069014842, "4": 0.014895643370901998}, "score": 1.8286030409191836}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9963017928746737, "4": 0.0036388903234741577, "3": 4.891125619186177e-05, "2": 1.3417725763271337e-06, "1": 0}, "score": 4.996259227940904}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8486606993158965, "4": 0.14686037110961958, "3": 0.004367626292264025, "2": 9.665225702710841e-05, "1": 1.065239295966219e-05}, "score": 4.844071186460954}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7990783563513492, "4": 0.1817696596100242, "3": 0.018000831998775293, "2": 0.0010569208041704223, "1": 7.321809266377215e-05}, "score": 4.7787603926697475}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.48950382644212015, "2": 0.3975025618511362, "4": 0.09226283250412812, "5": 0.01475460561278554, "1": 0.005944096718979221}, "score": 2.712372062236392}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.987820864409077, "4": 0.012037205107226565, "3": 0.00013163929360706107, "2": 3.0023807520523978e-06, "1": 0}, "score": 4.987690419441117}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993677023844415, "4": 0.0006262827572168909, "3": 4.344078085546789e-06, "1": 0, "2": 0}, "score": 4.999365028025713}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9932828992568349, "4": 0.0066226187876428635, "3": 8.626332683153938e-05, "2": 3.2236396843593464e-06, "1": 0}, "score": 4.9931951496494875}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9934999453478303, "4": 0.006390965030550393, "3": 0.00010240653797345536, "2": 2.8705239037253227e-06, "1": 0}, "score": 4.993395585142065}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7431176739658624, "4": 0.13708278028142762, "2": 0.10981955162028684, "5": 0.009775133655570908, "1": 0.00019968548584070684}, "score": 3.046414365194524}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.958979524704236, "4": 0.04054644385690196, "3": 0.0004114292025150605, "2": 3.834704831988786e-05, "1": 1.5410568772519225e-05}, "score": 4.958453646856344}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9550220784240525, "4": 0.04468138084695848, "3": 0.00026388477722374466, "2": 2.708347195747055e-06, "1": 0}, "score": 4.954781370367367}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997993406347839, "4": 0.00019926180397820145, "3": 9.88251121436709e-07, "1": 7.093754463890346e-08, "2": 0}, "score": 4.9997984778754105}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986252352560364, "4": 0.0013659201156965407, "3": 5.64446578452653e-06, "1": 1.8714333806441088e-07, "2": 0}, "score": 4.998622038227557}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9954521997043706, "2": 0.004540709507291936, "3": 3.980468627485601e-06, "4": 0, "5": 0}, "score": 1.0045486845924103}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9202783135124015, "3": 0.052199059578154294, "1": 0.02394217813280481, "4": 0.0033190539217228428, "5": 0.0002554522638558198}, "score": 2.035661558002418}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8259622902117354, "5": 0.09798665333945952, "3": 0.07506581627009593, "2": 0.0009707913444943481, "1": 1.188425670149715e-05}, "score": 4.020943655321898}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9298238308242993, "4": 0.06957642432407449, "3": 0.0005884978409527909, "2": 7.990709529008848e-06, "1": 0}, "score": 4.929222377392179}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.995855065054222, "4": 0.004105375772797266, "3": 3.511693729016387e-05, "2": 1.2163840423272633e-06, "1": 0}, "score": 4.995820727718784}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4685803440051546, "3": 0.3489660288695752, "4": 0.1452217346676222, "1": 0.01942080237560558, "5": 0.01763810783052744}, "score": 2.673019439738795}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5874030898599552, "3": 0.3447590540498229, "4": 0.039296551973468964, "1": 0.02160699228022225, "5": 0.0069165305547395925}, "score": 2.4225022700126777}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9906331805323015, "4": 0.009257867948283541, "3": 8.734122363383648e-05, "2": 2.0129052126919477e-06, "1": 0}, "score": 4.990561225913469}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7946729997600941, "4": 0.1931346432288784, "3": 0.010788192823249033, "2": 0.00130565950244965, "1": 7.669116847212139e-05}, "score": 4.781060452101868}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.3848540528773872, "3": 0.38203685346106964, "2": 0.15553988267860822, "5": 0.07057231854270687, "1": 0.0068381298395699345}, "score": 3.3568392003245138}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9352848627985823, "1": 0.041487404659181173, "3": 0.02308796021827023, "4": 0.00012511628163490226, "5": 1.038291386966507e-05}, "score": 1.9818818594428256}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8035377202323305, "3": 0.11205870424034207, "5": 0.08090660615254995, "2": 0.0034360610749621977, "1": 3.938738384174197e-05}, "score": 3.961856796734086}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5219280165176337, "5": 0.46029248711787285, "3": 0.017547699855927405, "2": 0.00015805966020099286, "1": 0}, "score": 4.44246129364286}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6177254659982617, "4": 0.37214392662713763, "3": 0.009708595032406347, "2": 0.0003254007689794649, "1": 0}, "score": 4.607424753688959}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8137850452721676, "4": 0.18412489029823667, "3": 0.002004423080555761, "2": 4.04881183892106e-05, "1": 0}, "score": 4.811736298471147}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"2": 0.969575385724042, "3": 0.021434930956522828, "1": 0.00889575306357922, "4": 8.824716388038773e-05, "5": 4.5932073906685795e-06}, "score": 2.012729465716525}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9778558553280616, "4": 0.02208494112000309, "3": 5.7690675536287165e-05, "2": 5.277664397835901e-07, "1": 0}, "score": 4.977798072358265}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.98712434175012, "4": 0.012740208031096092, "3": 0.00011668693251066594, "2": 1.6471187641299632e-06, "1": 0}, "score": 4.98702125460121}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6757818919801821, "4": 0.3082456959160901, "3": 0.015122418005773307, "2": 0.0007609306761358161, "1": 8.704433251134627e-05}, "score": 4.658877809957744}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9944741151806961, "4": 0.005458938074451595, "3": 6.075100090967005e-05, "2": 1.7565691464059633e-06, "1": 0}, "score": 4.994414265420238}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8975980021364451, "3": 0.09883578929434633, "1": 0.001868390899674145, "4": 0.0016552271976967728, "5": 2.199703250148652e-05}, "score": 2.1003459103549877}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6029425623154714, "2": 0.3467192514996222, "4": 0.04971203610740193, "5": 0.00040006240921064765, "1": 0.0002122259603925062}, "score": 2.703364345628622}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8072938101165066, "5": 0.18472927575112294, "3": 0.007918976589521436, "2": 4.3061746808598414e-05, "1": 0}, "score": 4.176726804619885}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.781769491337577, "4": 0.21387233658197072, "3": 0.004243655223935119, "2": 9.937529663380194e-05, "1": 1.0459310701678476e-05}, "score": 4.777299347097501}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6481063148245256, "5": 0.33712250444892283, "3": 0.014365446565244504, "2": 0.00038844265703118295, "1": 9.877185057583748e-06}, "score": 4.321952928076224}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.3721206311464869, "2": 0.25218016662472603, "4": 0.2492573953921528, "5": 0.0931943389514186, "1": 0.03306596742514481}, "score": 3.1173552718558075}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9242092702770793, "4": 0.07107149050585619, "3": 0.004224994584284395, "2": 0.00034585290616129, "1": 0.00013241084591889763}, "score": 4.918910022334157}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9860866400565069, "4": 0.013819048672825667, "3": 8.16602671979056e-05, "2": 9.658782943083945e-07, "1": 0}, "score": 4.986014569736392}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994745075795313, "4": 0.0005158151980217841, "3": 7.223210762237556e-06, "1": 4.686381038240613e-07, "2": 0}, "score": 4.999467862771548}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.882114723004701, "4": 0.11428259437053197, "3": 0.0033942423815597218, "2": 0.00014423552561034338, "1": 5.2533315955761595e-05}, "score": 4.878284660437079}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7323808598416405, "4": 0.2565588771925642, "3": 0.010603231137724245, "2": 0.00039385607786721055, "1": 0}, "score": 4.7210354685048275}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9323559841324295, "4": 0.06702221817572956, "3": 0.0005977753162204337, "2": 1.4477526607446665e-05, "1": 0}, "score": 4.931738147062927}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8974946631395511, "4": 0.10188464877542369, "3": 0.0006050569331383872, "2": 6.79417452804829e-06, "1": 0}, "score": 4.89688394360046}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987852632906639, "4": 0.0012097276830896995, "3": 4.45263278346691e-06, "2": 7.697670448675305e-08, "1": 0}, "score": 4.998781135536887}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8484978569529222, "4": 0.15023025928335326, "3": 0.0011855404884313096, "2": 3.152130158143218e-05, "1": 0}, "score": 4.847295724285251}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"2": 0.850304022430523, "1": 0.13962482150250494, "3": 0.009995272977470222, "4": 6.477563683958591e-05, "5": 9.585567271143806e-06}, "score": 1.8705285624097683}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6449112555158687, "4": 0.31576418309858173, "3": 0.034802414932407225, "2": 0.004156437258077497, "1": 0.0003341281352783821}, "score": 4.600812555958722}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5904825470529839, "5": 0.3976648952852554, "3": 0.011336122164125094, "2": 0.00048289756864556015, "1": 2.008064785431702e-05}, "score": 4.385307921237296}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8698676546474327, "4": 0.12684090428515635, "3": 0.0031078285875767372, "2": 0.00014359165727623438, "1": 2.4437053291927095e-05}, "score": 4.866412833563115}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.6415378463616758, "3": 0.329732486580205, "1": 0.01698877410186698, "4": 0.011219538630604799, "5": 0.0005181390061830185}, "score": 2.336738289479273}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4663137164945095, "3": 0.27072203110182075, "5": 0.18413249481323812, "2": 0.06914986314339067, "1": 0.008538196296395163}, "score": 3.7492093196981897}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7475813127759448, "5": 0.241007457978842, "3": 0.011144145346619465, "2": 0.00022551813070819342, "1": 0}, "score": 4.2294218124646115}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7418810193149247, "5": 0.23252912336834425, "3": 0.02491092043423226, "2": 0.0006009989923817139, "1": 0}, "score": 4.206432293846782}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9762627058087524, "4": 0.023572207717531712, "3": 0.00014514330402115336, "2": 3.7881794896943095e-06, "1": 0}, "score": 4.976125755447771}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7682429305741645, "5": 0.18918827419470935, "3": 0.03885185715863323, "2": 0.0034163894566378605, "1": 0.00019567254199958045}, "score": 4.142931610602952}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8294862049918938, "3": 0.1652946070358232, "1": 0.004161783793922402, "4": 0.001038192976155523, "5": 1.795402920453479e-05}, "score": 2.1632632765320086}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.751862099629791, "3": 0.1332978208024163, "4": 0.09996254631504893, "1": 0.007521106581883118, "5": 0.007321310038598137}, "score": 2.347677946245009}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5976376949065189, "4": 0.3972819296819541, "3": 0.0050123671020884265, "2": 6.273820285109694e-05, "1": 0}, "score": 4.592502973952555}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9632425131452278, "4": 0.03669908705927842, "3": 5.455659253045877e-05, "2": 1.0069193870642527e-06, "1": 0}, "score": 4.963188674590141}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6883996658815289, "3": 0.297432610197678, "5": 0.012509974410862667, "2": 0.0016529577831559004, "1": 4.47028228645743e-06}, "score": 3.7117579451461937}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9329218254650029, "3": 0.05319185477976068, "1": 0.013357055925704697, "4": 0.0005075725000551145, "5": 2.121341061710091e-05}, "score": 2.0409136036394004}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5130116112766347, "3": 0.4145961355233083, "4": 0.06299877482512135, "1": 0.008930900940401514, "5": 0.0004618871318890017}, "score": 2.5330488135938225}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6419413978923557, "4": 0.3522778740124249, "3": 0.005709702261606992, "2": 6.505386102760534e-05, "1": 5.2555336914525115e-06}, "score": 4.636086277024567}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.30220399787360924, "1": 0.22668336569725164, "3": 0.2145617936108246, "2": 0.19722560548187343, "5": 0.059285566534441544}, "score": 2.770173676671549}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5474449008897943, "3": 0.36687734375165426, "4": 0.08249117178780503, "1": 0.002638235385225274, "5": 0.00054810236007556}, "score": 2.53086588952261}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8422449100421437, "4": 0.12269552487705929, "3": 0.024362493035942803, "2": 0.00905640714446502, "1": 0.001582952665973497}, "score": 4.795066629791064}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9919185598428627, "4": 0.007983426290157877, "3": 6.224306091984365e-05, "2": 3.987416621661811e-06, "1": 0}, "score": 4.991879867252797}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9779316636080452, "4": 0.021800416584258926, "3": 0.00021270230477823113, "2": 6.327635058936804e-06, "1": 0}, "score": 4.977754108302302}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970077652846782, "4": 0.002971654531400712, "3": 1.5518650489282217e-05, "2": 4.5063145701006714e-07, "1": 0}, "score": 4.996995942421835}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9933659379995458, "4": 0.006562399273383119, "3": 4.890406676563742e-05, "2": 2.6104472269155283e-06, "1": 0}, "score": 4.993331826899632}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"2": 0.49860977659113886, "3": 0.376355331976996, "4": 0.08879830650992868, "5": 0.01904243631660376, "1": 0.017014046693769627}, "score": 2.5941722188052996}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.651565435005673, "4": 0.20716139572996442, "3": 0.0968430550511736, "2": 0.0354497882224744, "1": 0.008725120500879173}, "score": 4.457764265960637}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991427438541807, "4": 0.0008467235532490857, "3": 7.430451009000933e-06, "1": 3.6600201430302934e-07, "2": 0}, "score": 4.999136949175249}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9874185486386107, "4": 0.012315052306960752, "3": 0.000250887481554416, "2": 7.324482895676085e-06, "1": 0}, "score": 4.987161094167967}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.882206935276087, "4": 0.10798758631413381, "3": 0.009061949549604858, "2": 0.0005694406469994572, "1": 0.0001676642651158393}, "score": 4.871508710163822}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7398144259327324, "4": 0.2555121542550382, "3": 0.004564706776346931, "2": 6.477013114444989e-05, "1": 0}, "score": 4.735152483629652}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9593710590937772, "4": 0.040398307033680275, "3": 0.00021535967943858228, "2": 9.012797916294606e-06, "1": 0}, "score": 4.959143679396124}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9945370668873348, "4": 0.005440915183514778, "3": 1.7111479566697727e-05, "2": 5.557212596329187e-07, "1": 0}, "score": 4.994523170865377}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9641748511096156, "4": 0.03557725321419923, "3": 0.00021946429584022368, "2": 1.0458170698943269e-05, "1": 0}, "score": 4.963951795780091}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5846645003158734, "4": 0.40243573881007677, "3": 0.01243459962091817, "2": 0.0003930753241328974, "1": 0}, "score": 4.571484946069935}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7721409252161577, "1": 0.10766090067110584, "3": 0.09849114828195758, "4": 0.01955258062467527, "5": 0.0021478799351723975}, "score": 2.0363792875055986}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9482485031061808, "4": 0.05081863301578512, "3": 0.0008491459315737259, "2": 5.192386743474566e-05, "1": 1.546014709958509e-05}, "score": 4.9472646015539565}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8840328998607349, "4": 0.1122456394370839, "3": 0.003263500130177762, "2": 0.0003601771731284466, "1": 6.868237100742144e-05}, "score": 4.8798686033520235}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9939817858380908, "4": 0.005848999254376827, "3": 0.0001388934452141995, "2": 1.1054919781395575e-05, "1": 0}, "score": 4.993839930412607}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8617390330817986, "4": 0.13020764937153345, "3": 0.00779334199645677, "2": 0.00020463145034677163, "1": 5.3618467838780154e-05}, "score": 4.853377045395891}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.398913969750842, "3": 0.38102263354117427, "2": 0.15327817057726675, "5": 0.06382702429652014, "1": 0.0029366388498170844}, "score": 3.3674244928355805}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.809375383720112, "4": 0.17957146797788062, "3": 0.00985848276497083, "2": 0.0009899610094551117, "1": 0.00010526137660334891}, "score": 4.797300480878516}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8864208776154181, "4": 0.11161057226103993, "3": 0.001937784439554385, "2": 2.3723344372305933e-05, "1": 0}, "score": 4.884441875027174}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9940204202753591, "4": 0.005851914536987624, "3": 0.00011104700253708176, "1": 7.153663177059116e-06, "2": 5.3365296208185e-06}, "score": 4.993881341958594}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955380873419685, "4": 0.004385983898964082, "3": 6.97256013424197e-05, "2": 2.1881546388734973e-06, "1": 0}, "score": 4.995467982238369}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6635971867838195, "3": 0.2963553316062154, "4": 0.029920410681024225, "1": 0.009039270542817916, "5": 0.0010854384198619327}, "score": 2.350414025351137}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5028232461207236, "4": 0.40721576454244984, "3": 0.08140291465843529, "2": 0.008046862621325266, "1": 0.00034134986827305525}, "score": 4.4043712439994085}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9610354327345813, "4": 0.03861190231160017, "3": 0.00034467438437880076, "2": 2.557777092310708e-06, "1": 0}, "score": 4.960690862029981}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9759219675949473, "4": 0.02277135710754141, "3": 0.0012220746887627997, "2": 4.335901143938302e-05, "1": 2.5629334079439126e-05}, "score": 4.974551501835645}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8105472193275262, "4": 0.18435428698041587, "3": 0.004750128541183255, "2": 0.00016227031535790605, "1": 0}, "score": 4.805622472337105}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9352553550266485, "2": 0.06460391282380047, "3": 0.0001286445992881423, "4": 6.672773902817344e-07, "5": 0}, "score": 1.0648639446184947}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.82652538362724, "1": 0.1166821625651321, "3": 0.05511959499498151, "4": 0.0014823153321670169, "5": 0.00010802574279825537}, "score": 1.941721331298682}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.40570245805032806, "3": 0.3493546792195343, "5": 0.21030069320745595, "2": 0.03320941031497489, "1": 0.001380610619194817}, "score": 3.7903744298227866}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.45251859172550146, "4": 0.263777614538619, "2": 0.21060010093686854, "5": 0.06235452720182826, "1": 0.010604226827874992}, "score": 3.1567008263745815}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.43746389600799895, "2": 0.26122760548732976, "1": 0.1251658651577311, "4": 0.10242353078016465, "5": 0.0735406694456837}, "score": 2.737898766327574}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7807458330070145, "3": 0.14318833317732757, "5": 0.05157115883832677, "2": 0.024321722449215863, "1": 0.000160786686507259}, "score": 3.8592553084254213}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6095336636516784, "4": 0.3815135542710625, "3": 0.007070345017868955, "2": 0.001696248213536216, "1": 9.857350937989298e-05}, "score": 4.59882756815747}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9222112132912026, "4": 0.07754144588164995, "3": 0.0002384840800925086, "2": 5.937282623812611e-06, "1": 0}, "score": 4.921963546285643}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9538635043229365, "4": 0.04598726355823317, "3": 0.00014390733103854478, "2": 3.3259573516191417e-06, "1": 0}, "score": 4.953714851391472}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9374084399128305, "4": 0.06219354890310374, "3": 0.00039500327577352825, "2": 2.8136696537434465e-06, "1": 1.7091234742839547e-07}, "score": 4.9370073184176135}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6204402948490333, "1": 0.3688073455732805, "3": 0.009992474692814663, "4": 0.0004215136486111499, "5": 0.0003254194800616198}, "score": 1.6429997910772722}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9981073099011641, "4": 0.0018745635874706768, "3": 1.3332391933481306e-05, "2": 2.647097220042577e-07, "1": 0}, "score": 4.998097968884419}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9154326902157726, "4": 0.08363133571462993, "3": 0.0009113755557909849, "2": 1.3361448166955039e-05, "1": 0}, "score": 4.914504868114879}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987008484290155, "4": 0.001290299780012222, "3": 7.4322493957411304e-06, "2": 2.1793434265563717e-07, "1": 0}, "score": 4.998694180349086}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996418377554159, "4": 0.0003547263183630614, "3": 2.654495341151354e-06, "2": 1.638173089278575e-07, "1": 0}, "score": 4.999639473016362}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5463315462287954, "4": 0.4436699272981765, "3": 0.00978011535514862, "2": 0.00012968838804328775, "1": 0}, "score": 4.536339639614505}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9909197725339052, "4": 0.009039262407478089, "3": 3.7576488838366136e-05, "2": 9.357729169495914e-07, "1": 0}, "score": 4.990882754933345}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9946501634201637, "4": 0.005313736600287156, "3": 2.751588730296351e-05, "2": 1.1763360411843229e-06, "1": 0}, "score": 4.994627662820021}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9275310202929834, "4": 0.07167305528385341, "3": 0.0007191231035122552, "2": 4.1801430354995064e-05, "1": 0}, "score": 4.926760730851745}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9727565759264999, "4": 0.02706599056284051, "3": 0.00016079762037368855, "2": 5.946504440723641e-06, "1": 0}, "score": 4.9725942817327935}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"4": 0.474107921838197, "5": 0.30134352075930204, "3": 0.1489972842072154, "2": 0.07219660906824975, "1": 0.0032430825407739035}, "score": 3.9982235725766757}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9630660180160168, "4": 0.035755391858418244, "3": 0.0011461480277097438, "2": 2.573761544865571e-05, "1": 0}, "score": 4.961874843630376}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982615998709594, "4": 0.0016937242100346433, "3": 4.0652793644090235e-05, "2": 1.4039470033146166e-06, "1": 0}, "score": 4.998220753701504}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998598718912488, "4": 0.001393243216999268, "3": 6.461377678379633e-06, "1": 1.5999536354119216e-07, "2": 0}, "score": 4.99859319205345}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9738929295262582, "4": 0.02360378024276041, "3": 0.0020733222636271404, "2": 0.0002969333069802553, "1": 0.00012425520531273357}, "score": 4.97086149866763}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.680202895215592, "2": 0.26861616883489553, "4": 0.04689114159223979, "5": 0.0025169863146776925, "1": 0.0017710122556837363}, "score": 2.779766525382941}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9866598136315117, "4": 0.013076465384692879, "3": 0.00024103678530523986, "2": 7.3100240075603325e-06, "1": 0}, "score": 4.986419322180963}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9981562423133462, "4": 0.0018267113597010653, "3": 1.418527646413766e-05, "2": 2.055369528405963e-07, "1": 0}, "score": 4.998144296548667}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995847869048258, "4": 0.00040917320805160565, "3": 4.476558494235573e-06, "1": 2.813878134675743e-07, "2": 0}, "score": 4.99958074758625}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9915897814372565, "4": 0.008121952484148839, "3": 0.00024510594801931514, "2": 1.475452120166473e-05, "1": 0}, "score": 4.991343326158111}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"5": 0.99793122137843, "4": 0.0020236823127099293, "3": 3.831833713437746e-05, "1": 6.46282579009903e-07, "2": 0}, "score": 4.997897082988272}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9994811795339072, "4": 0.0005074013247211888, "3": 9.210918353672608e-06, "1": 7.28059544644808e-07, "2": 0}, "score": 4.999471263817776}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9828138510273524, "4": 0.016624246778882083, "3": 0.0005510166122454775, "2": 7.513546249346061e-06, "1": 2.031614014064386e-06}, "score": 4.982243029100001}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998364025435236, "4": 0.0001607122595025873, "3": 1.6048616571811488e-06, "1": 2.333561522489797e-07, "2": 0}, "score": 4.999835144419974}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996308859893444, "4": 0.0003571011796331869, "3": 6.689569738620009e-06, "1": 3.6442863515469547e-06, "2": 0}, "score": 4.999614941888981}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7532632731138952, "3": 0.1855980992114682, "1": 0.03255539106255753, "4": 0.025756282527000046, "5": 0.002725993037008346}, "score": 2.212754732254686}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6789284041914208, "5": 0.17273958631065112, "3": 0.1277577610352495, "2": 0.020074663127248947, "1": 0.0004898251829533176}, "score": 4.003363056295987}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7061729781185132, "5": 0.1458449365650821, "3": 0.1352843796786187, "2": 0.012293200184492124, "1": 0.00034296279022229465}, "score": 3.984944341581499}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9852565902676862, "4": 0.014668792515452337, "3": 7.214035222360777e-05, "2": 1.583115210286809e-06, "1": 4.567407014357807e-07}, "score": 4.985180343995345}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.609715514665276, "4": 0.38284050981092194, "3": 0.007180250557091674, "2": 0.00021525740788226654, "1": 2.26169258631018e-05}, "score": 4.602052461952049}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5713466275533949, "5": 0.1844275823759853, "3": 0.13341309325229328, "2": 0.09951229247360882, "1": 0.011258419840492204}, "score": 3.818207012166532}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9281457224699236, "4": 0.07087334983192348, "3": 0.0008235869730658682, "2": 0.00011841632084967175, "1": 0}, "score": 4.927121390502938}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9910366029162335, "4": 0.008935179866672997, "3": 1.9163828271080715e-05, "2": 7.725238151318958e-07, "1": 0}, "score": 4.991024100577127}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9947215228788008, "4": 0.005266301318123946, "3": 1.1315138936366307e-05, "2": 2.885717735895029e-07, "1": 0}, "score": 4.994710199662428}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993074619152728, "4": 0.0006903148224566541, "3": 1.6892515448436944e-06, "2": 1.88121275433386e-07, "1": 0}, "score": 4.99930574207049}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8053793019408418, "4": 0.18555107461139647, "3": 0.008488435256026185, "2": 0.00043147602973651243, "1": 0}, "score": 4.796147107530081}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9898621252265918, "4": 0.009964704296175164, "3": 0.00013712604755245893, "2": 3.6857482500670643e-06, "1": 0}, "score": 4.989749654676311}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9911568635847954, "4": 0.008585513266414279, "3": 0.00014689904144896192, "2": 6.180032670623445e-06, "1": 0}, "score": 4.99110121823777}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9155925570297033, "4": 0.07935676344819825, "3": 0.0049331453121919345, "2": 7.75088061746618e-05, "1": 0}, "score": 4.910540838869852}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9916808651249065, "4": 0.007982521020946307, "3": 0.0003025604396363762, "2": 1.3691491177716082e-05, "1": 0}, "score": 4.991371107925409}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6502070944439424, "4": 0.3090741695441436, "3": 0.038262491379865544, "2": 0.0022700100958220858, "1": 0.0001640489006319863}, "score": 4.606925901207414}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.709481583309085, "5": 0.24044238056282385, "3": 0.04461322228962133, "2": 0.005209587505290064, "1": 0.0001868881964234053}, "score": 4.184861582046263}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9947930092196557, "4": 0.0051529660399664695, "3": 3.4814102814031834e-05, "2": 1.0709344209279065e-06, "1": 0}, "score": 4.994774098154835}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8988638302526769, "4": 0.0998936658742452, "3": 0.001176463940588619, "2": 3.654230234883794e-05, "1": 0}, "score": 4.8976407599825285}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969311009274306, "4": 0.003012807230913621, "3": 2.1678425685759467e-05, "1": 0, "2": 0}, "score": 4.99694373074105}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8632781792810861, "3": 0.11900959010501061, "4": 0.015397301687683457, "1": 0.0019376584876592945, "5": 0.0003575697893203712}, "score": 2.1489421786182974}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.81143207382333, "3": 0.1179784262053393, "5": 0.037137367723643365, "2": 0.03331538422303242, "1": 0.00013044015744680416}, "score": 3.852135919892917}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7732289272273078, "3": 0.1921289534205037, "5": 0.03137878661149212, "2": 0.003248964983425718, "1": 1.078198362145143e-05}, "score": 3.832718957441318}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7287174411374296, "4": 0.27016418829723277, "3": 0.0010730443322687212, "2": 3.482019581514629e-05, "1": 0}, "score": 4.727582400421334}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5665124962860483, "4": 0.4026311084033891, "2": 0.025148563534299277, "5": 0.0056974646576307825, "1": 8.429340681347123e-06}, "score": 3.3888613690299754}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9233218180247234, "2": 0.07648852112973979, "3": 0.00017775666384459485, "5": 3.393541471547022e-06, "4": 0}, "score": 1.0768582627363374}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.617111597673553, "5": 0.21540164011781557, "3": 0.10224753417478882, "2": 0.05924477431924723, "1": 0.005920721278046229}, "score": 3.9769006903020068}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.70668386006465, "4": 0.29021005227609786, "3": 0.0029561486192850655, "2": 6.83577919883061e-05, "1": 0}, "score": 4.7036484003760295}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8882816223348242, "4": 0.10815016510008496, "3": 0.0028019532940399055, "2": 0.00047645989700322386, "1": 0}, "score": 4.884783158852382}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7931227320730003, "4": 0.19935745685706557, "3": 0.006724992289753143, "2": 0.0006859471321808163, "1": 9.667168608332565e-05}, "score": 4.784745404324683}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6152775574868168, "3": 0.16440662485507132, "1": 0.11322057180474555, "4": 0.061686597011933283, "5": 0.0451406909900253}, "score": 2.310064404235826}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8471898376385039, "4": 0.13627582801374805, "3": 0.009795952390499843, "2": 0.004012338662729252, "1": 0.002565620292912374}, "score": 4.821804183337632}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9933852345189833, "4": 0.006547236020482468, "3": 4.808674454582049e-05, "2": 2.8109557721860414e-06, "1": 0}, "score": 4.993348046989422}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977449976465389, "4": 0.0022163497347702853, "3": 2.4100547497189562e-05, "1": 2.3774430417899155e-06, "2": 0}, "score": 4.997725911711889}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.827001012214254, "4": 0.16341897127851746, "3": 0.0068861095851291045, "2": 0.0014535768020116399, "1": 0.001029602472775124}, "score": 4.814290535135474}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"4": 0.682751057326806, "5": 0.2310121205323094, "3": 0.07435400802477607, "2": 0.011227613993412924, "1": 0.0006004779118810057}, "score": 4.132408696481668}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.534373685060306, "5": 0.4242639473919228, "3": 0.03555182101479243, "2": 0.0052919117975391795, "1": 0.00039420676580949836}, "score": 4.376992590907275}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9868659612258632, "4": 0.01306635464954874, "3": 5.829058324722629e-05, "2": 7.091689822180386e-07, "1": 0}, "score": 4.9868148221720165}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9639082801218395, "4": 0.035610925220087505, "3": 0.00043517861585167704, "2": 2.412784476429462e-05, "1": 0}, "score": 4.963445548524645}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9886510576734606, "4": 0.01123636034137821, "3": 9.665138716070953e-05, "2": 4.474880099518913e-06, "1": 0}, "score": 4.988556781153715}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9096718762897401, "1": 0.08978088394486483, "3": 0.000542895883233611, "4": 9.10385227581936e-07, "5": 0}, "score": 1.910763526315665}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.45927303420944404, "3": 0.3259927947022574, "5": 0.1560307618228669, "2": 0.0517357110468577, "1": 0.006614331795812759}, "score": 3.7066198789555735}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8906452668701523, "4": 0.10781080431207828, "3": 0.0014566354339454414, "2": 2.366505666842034e-05, "1": 0}, "score": 4.889197879496453}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943809870406026, "4": 0.005553221884113821, "3": 6.0652663962629724e-05, "2": 1.4301817841335975e-06, "1": 0}, "score": 4.994321161184171}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.47778976758797503, "4": 0.4613969378102435, "3": 0.05949000284257044, "2": 0.0012836707908599906, "1": 2.364800031211773e-05}, "score": 4.415668118616322}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"1": 0.5479476641339844, "2": 0.45082747115387917, "3": 0.0012058885474468986, "4": 1.1299613910975507e-05, "5": 0}, "score": 1.4532766266915478}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5765991084489891, "5": 0.39238232328472017, "3": 0.028976454284684216, "2": 0.0017622259935785739, "1": 0}, "score": 4.359982171698641}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7449026204137593, "4": 0.2525307892693812, "3": 0.0023545303456523757, "2": 3.857901817027017e-05, "1": 0}, "score": 4.742599758945672}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9938261066876901, "4": 0.0061163699736280115, "3": 5.37454793290293e-05, "2": 1.3166169867677556e-06, "1": 0}, "score": 4.993772173888565}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7868501541716773, "5": 0.19758587085403753, "3": 0.01498175727044077, "2": 0.0005155824631434923, "1": 0}, "score": 4.181585048620732}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9672761503456061, "3": 0.03053447823175336, "1": 0.0021180720805850984, "4": 6.923015668665981e-05, "5": 1.733111863961201e-06}, "score": 2.0285600753984183}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7668313917557551, "5": 0.19254463153461096, "3": 0.03821762814689694, "2": 0.002318838187469221, "1": 6.433292531509628e-05}, "score": 4.149499793260806}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8418128145206575, "3": 0.08553675605823759, "5": 0.0710429610300936, "2": 0.001534214124583852, "1": 4.0167072099063404e-05}, "score": 3.98231669041529}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8368891203232734, "5": 0.08657401207178966, "3": 0.07035598671763685, "2": 0.006041841073428893, "1": 7.763881985484073e-05}, "score": 4.003901666313921}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.868515436249075, "4": 0.13038847699459621, "3": 0.0010455760514903598, "2": 2.1657126263691434e-05, "1": 0}, "score": 4.867451575027237}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6877766158742963, "5": 0.2001192780408123, "3": 0.10608832257238877, "2": 0.005880849821786418, "1": 0.00011445337764853377}, "score": 4.081927573594261}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9385362108023612, "4": 0.06039046806431184, "3": 0.0010134326977999189, "2": 2.696308094699725e-05, "1": 0}, "score": 4.937499719453349}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9522211792790567, "4": 0.047244289003417886, "3": 0.00050967682987979, "2": 4.278175176153242e-06, "1": 0}, "score": 4.951722529419663}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978274778498202, "4": 0.0021578973078549566, "3": 1.2698267387344187e-05, "1": 2.3428535470040559e-07, "2": 0}, "score": 4.997815765319593}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9979427382697329, "4": 0.0020422359856022876, "3": 1.2135554810147107e-05, "2": 2.1245364787973635e-07, "1": 0}, "score": 4.997932850008551}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4948414850108858, "4": 0.34179849892045716, "2": 0.14776442445738933, "5": 0.015182807148005113, "1": 0.00040903574894812295}, "score": 3.223582455407933}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.46972444661850166, "4": 0.42267078035471844, "3": 0.0778396762722387, "2": 0.02639008256037075, "1": 0.0032793393321481844}, "score": 4.329298092778668}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9052501415235249, "4": 0.09167663779077324, "3": 0.00294856549435357, "2": 0.0001014557312440814, "1": 0}, "score": 4.902119593254197}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.983525265606523, "4": 0.016286805133574302, "3": 0.00015841822949658955, "2": 1.6062149765966562e-05, "1": 0}, "score": 4.983347948006675}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.515026254503176, "1": 0.27738415289619806, "3": 0.16532685915974826, "4": 0.027060204472613255, "5": 0.015150762776657003}, "score": 1.9875147572252774}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9763001959927438, "2": 0.023528237110036633, "3": 0.00015601443857963924, "4": 5.001778543897717e-06, "5": 0}, "score": 1.0238555230148196}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8491868962258596, "5": 0.09609704622026143, "3": 0.05431032080660814, "2": 0.00039193270650083494, "1": 9.101512040022417e-06}, "score": 4.040975748154165}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7418606549604465, "5": 0.25351459085344413, "3": 0.004516097694306053, "2": 6.376079850223234e-05, "1": 0}, "score": 4.248882145298597}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9039132008126812, "4": 0.09588938417880617, "3": 0.0001737555728633611, "2": 2.4934232312046294e-06, "1": 0}, "score": 4.903753587253007}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9663439540990936, "4": 0.03356516183710625, "3": 8.734139831645846e-05, "2": 1.2908133944024098e-06, "1": 0}, "score": 4.966256206940046}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9996604233691999, "2": 0.0003138141896241927, "3": 1.765144338043982e-05, "5": 1.809603133478124e-06, "4": 0}, "score": 1.0003563577344698}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6907975495361472, "3": 0.18752653942275377, "1": 0.07914802860820361, "4": 0.03385227749188096, "5": 0.00866405605005309}, "score": 2.2020775677202673}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9958881651378514, "4": 0.004073221782174505, "3": 3.502610210492486e-05, "2": 1.7775154203575616e-06, "1": 0}, "score": 4.995851385960593}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9710101709780474, "4": 0.028833257032142196, "3": 0.0001399208013596642, "2": 7.697438090393814e-06, "1": 0}, "score": 4.97086354817035}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8145722501199397, "4": 0.1809369049364105, "3": 0.0041660463934315465, "2": 0.0002761489952623836, "1": 4.077411965512082e-05}, "score": 4.809737960415935}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9370590016964137, "3": 0.03245096169699991, "1": 0.028596223938369927, "4": 0.001579235831325454, "5": 0.0003082464292279665}, "score": 2.007937998959734}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9640445420432248, "4": 0.033795074904328766, "3": 0.0019608759349216366, "2": 0.0001593497637002083, "1": 3.781268233886426e-05}, "score": 4.96165378329609}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7059615674572746, "5": 0.22994880081300403, "3": 0.06350926996736808, "2": 0.0005682449398878984, "1": 9.728070360353673e-06}, "score": 4.1652742515539956}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9865460898825944, "4": 0.012348562740104381, "3": 0.0009724712946273597, "2": 9.929513311974692e-05, "1": 3.2069600546880624e-05}, "score": 4.985280308622502}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973269720184172, "4": 0.0026424847798248684, "3": 2.8939503300124e-05, "2": 8.668897767708387e-07, "1": 3.8745194838883727e-07}, "score": 4.997295484791611}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.29762546851423594, "2": 0.2680132927199497, "5": 0.2080227146906017, "3": 0.1405623101371028, "1": 0.08543262716825874}, "score": 3.2748867983060768}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.49709881982709964, "4": 0.46992341705065976, "3": 0.031774642911589324, "2": 0.0011245694811387126, "1": 6.484666985654493e-05}, "score": 4.462886841372551}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6042102171262491, "5": 0.3702025095360882, "3": 0.024122033573531595, "2": 0.001368030725326514, "1": 6.186809124227487e-05}, "score": 4.343170938224309}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998408802099907, "4": 0.0015588186815501074, "3": 2.699793976152589e-05, "2": 2.050235281369364e-06, "1": 1.8552149362847687e-06}, "score": 4.998373611473069}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.928332660560071, "4": 0.06910592545525318, "3": 0.0023850719199051246, "2": 0.00013822220314774618, "1": 2.9654994444835676e-05}, "score": 4.925590014247068}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6179804539112159, "4": 0.36024623328261984, "3": 0.021344646930412964, "2": 0.00040508768828889663, "1": 1.8565937005418835e-05}, "score": 4.595772919956299}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7419117709204979, "3": 0.19188811714627277, "5": 0.03741417633467118, "2": 0.028570301779060038, "1": 0.0001912254422573434}, "score": 3.7878066000069515}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9746954673036461, "4": 0.025175786488788876, "3": 0.00012405730028767386, "2": 1.761459202661808e-06, "1": 0}, "score": 4.974570740090189}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8060302066052751, "4": 0.18687283877269667, "3": 0.006971227205865853, "2": 0.00010796558921384515, "1": 1.2867600436627419e-05}, "score": 4.7988083549687}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9963313747096243, "4": 0.0036481156681308726, "3": 1.7834050118097226e-05, "2": 2.865436374997269e-07, "1": 0}, "score": 4.996315347797982}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6556408334245132, "5": 0.20172550335444342, "3": 0.11844613247843698, "2": 0.0230929362098411, "1": 0.001038250389814577}, "score": 4.033980661898152}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9881580780561983, "4": 0.011598273826536894, "3": 0.00022679341974536158, "2": 8.339836050502282e-06, "1": 4.498421502261329e-06}, "score": 4.987905077561281}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.893677783425711, "4": 0.10004167798226314, "3": 0.00607593738257722, "2": 0.00017242262031811657, "1": 1.908274565582821e-05}, "score": 4.887211371346778}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9445649054748515, "4": 0.05456125300917242, "3": 0.0008561821606196343, "2": 1.4247444509475883e-05, "1": 1.928208932823937e-06}, "score": 4.943675843932071}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9747075877171405, "4": 0.02479618173408251, "3": 0.0004847977811768829, "2": 8.972367332919724e-06, "1": 2.0519028004077597e-06}, "score": 4.974199087450756}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7012317341797369, "3": 0.1617964686496204, "5": 0.13295592455592073, "2": 0.00396279775255964, "1": 3.110384851412989e-05}, "score": 3.9631397389983416}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9819577951633482, "4": 0.017877277248483647, "3": 0.00015368984190610263, "2": 5.749181851352707e-06, "1": 0}, "score": 4.981797995619276}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.525936813440064, "3": 0.37287818292948127, "5": 0.09371790681927838, "2": 0.007376990609674932, "1": 7.966716814608128e-05}, "score": 3.705843670458273}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8862249647977123, "4": 0.10977382130103704, "3": 0.0037627225543449844, "2": 0.00015590698165461933, "1": 0}, "score": 4.882223286130152}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5214659756032739, "4": 0.36424749903414616, "2": 0.06608071034858093, "5": 0.043088204363115425, "1": 0.005112507452053003}, "score": 3.3741200917169043}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7304743655913918, "3": 0.1777668355528469, "1": 0.058736784261679574, "4": 0.025256255787154406, "5": 0.007756314447037081}, "score": 2.192813327205041}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9399343279891585, "4": 0.05800415111781436, "3": 0.0018393721286947085, "2": 0.00020019052897888087, "1": 1.596138803679918e-05}, "score": 4.937652313596157}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9677861282570756, "4": 0.03170008869985929, "3": 0.0004741429497427825, "2": 2.281347928457295e-05, "1": 0}, "score": 4.96728263444032}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984569307574775, "4": 0.0015294767431708052, "3": 1.2217093259342855e-05, "2": 5.803050055442254e-07, "1": 0}, "score": 4.998444346918391}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9913226028327606, "4": 0.00854240239373759, "3": 0.00011726103968198054, "2": 6.31863723771607e-06, "1": 0}, "score": 4.991204019208214}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4195249413063219, "3": 0.30057733611439724, "1": 0.1801300840390713, "5": 0.05453785670545278, "4": 0.0452161479686987}, "score": 2.374498223987707}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9988969486089252, "4": 0.0010938915626052066, "3": 6.897465725407307e-06, "2": 1.2775339919966945e-07, "1": 0}, "score": 4.998891927880445}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.994621390298022, "4": 0.0053185211159365, "3": 5.619476246390229e-05, "2": 6.229531634736811e-07, "1": 0}, "score": 4.9945672027296695}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9939634156340735, "4": 0.005899498096964964, "3": 0.00011516772659928399, "2": 5.23963876492012e-06, "1": 0}, "score": 4.993854345030755}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990943073873628, "4": 0.0008982566757924396, "3": 6.013924665487036e-06, "2": 2.2770907718565324e-07, "1": 0}, "score": 4.999089031259673}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.498911910938227, "2": 0.40625513720112033, "4": 0.08639547303267218, "5": 0.00554762428290853, "1": 0.002868560336440809}, "score": 2.6854917665205473}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.615905559316571, "4": 0.20078995847692876, "2": 0.1633666038905449, "5": 0.017900224935237446, "1": 0.0020132509005040145}, "score": 3.0691989912828657}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.940569176545654, "4": 0.05799087548707738, "3": 0.0013782597862912623, "2": 1.7899245443508643e-05, "1": 0}, "score": 4.939196244672288}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941701558778425, "4": 0.005763474928386937, "3": 5.916206591046903e-05, "2": 2.568334303804731e-06, "1": 0}, "score": 4.994110468616561}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9667652539801229, "4": 0.030683761674771565, "3": 0.002182240887704226, "2": 0.00017559997835962945, "1": 0.0001266200104902513}, "score": 4.963916076145006}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8025675203576561, "2": 0.19621189632978614, "3": 0.0011131571741413145, "5": 1.598985658822651e-05, "4": 0}, "score": 1.1985203220645386}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.4904337035843258, "1": 0.3604366737363669, "3": 0.11738369093737006, "4": 0.020419480649340054, "5": 0.010958005433700025}, "score": 1.8305975792142382}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9241931799337506, "4": 0.07399544808757469, "3": 0.0014610747265290053, "2": 7.102717554497974e-05, "1": 0}, "score": 4.922847774624843}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9644902389586555, "4": 0.03165577128302943, "3": 0.0036532266068885974, "2": 0.000108816454365529, "1": 7.953654153160415e-05}, "score": 4.960392688441074}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9342537375834823, "4": 0.06241728117756128, "3": 0.0030031065783039947, "2": 0.0001490137461848503, "1": 0}, "score": 4.931117281766738}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7024152188277181, "5": 0.18944231635131517, "3": 0.10541943152998884, "2": 0.002633215910818209, "1": 7.85267678170682e-05}, "score": 4.078521759254983}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6856503191950206, "4": 0.3101244532408566, "3": 0.004158675270560536, "2": 6.088894054415053e-05, "1": 0}, "score": 4.681373724903314}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7211634199710457, "4": 0.2741778762029218, "3": 0.004568076773323807, "2": 6.93762477828725e-05, "1": 0}, "score": 4.716471816304959}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9752303270608116, "4": 0.024559665389549897, "3": 0.00019937162748579154, "2": 4.15909523055961e-06, "1": 0}, "score": 4.975028952336634}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9813257631623845, "4": 0.01854779620409642, "3": 0.00012486767267430232, "2": 1.2508865725683637e-06, "1": 2.1674397904731587e-07}, "score": 4.981197846834485}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7742387425865835, "4": 0.21159404967964013, "3": 0.013653273080200284, "2": 0.0004147405143171448, "1": 0}, "score": 4.759831359295418}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9728022732127402, "4": 0.026340687026408537, "3": 0.0007895203095712655, "2": 3.354358231592645e-05, "1": 0}, "score": 4.97197868955913}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.998027755235673, "4": 0.0019578571394949177, "3": 7.499149078939837e-06, "1": 0, "2": 0}, "score": 4.998027130972288}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990005595736067, "4": 0.0009904764182840442, "3": 5.415306917421372e-06, "1": 9.011907369573948e-08, "2": 0}, "score": 4.998998329027226}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9798546447519025, "4": 0.01996980891905581, "3": 0.00017040186479437138, "2": 2.5921627295052274e-06, "1": 0}, "score": 4.979681559004379}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"3": 0.46508109069839776, "2": 0.34575276892827334, "4": 0.10998961794084174, "5": 0.05310650784275065, "1": 0.025606967411882665}, "score": 2.8191521888057096}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5469262565496898, "4": 0.27667332524461535, "2": 0.14554709030854218, "5": 0.029791939757284728, "1": 0.001041324310919703}, "score": 3.1886312504939474}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5553802081790336, "4": 0.37512949223190256, "3": 0.06696618422911045, "2": 0.002301790455444695, "1": 0}, "score": 4.483918030068859}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6437628152615044, "4": 0.3464860572425578, "3": 0.009202526620212382, "2": 0.0003147940318959126, "1": 0}, "score": 4.63407895257614}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7674900605715627, "4": 0.20085279548527346, "3": 0.028865412497342, "2": 0.0024614885756290674, "1": 0.00030240753398429925}, "score": 4.73281484646864}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9412337135679403, "3": 0.050674041574751964, "1": 0.007946301330665428, "4": 0.00014067785469679033, "5": 5.315305866696118e-06}, "score": 2.043025039735579}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.61912825541346, "2": 0.2091975412432036, "4": 0.15056385485886942, "5": 0.017212121586096998, "1": 0.0038831767901516523}, "score": 2.9680237219611114}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962803702253227, "4": 0.003683201250213505, "3": 3.3569790086517454e-05, "2": 3.8915893636459043e-07, "1": 0}, "score": 4.996248482428149}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9513884243713563, "4": 0.04513684968067208, "3": 0.0031560807188835247, "2": 0.0002186550902542841, "1": 5.959177480763861e-05}, "score": 4.947654541840694}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9382569815132688, "4": 0.05850788777926504, "3": 0.002709619662177284, "2": 0.0003387524341884563, "1": 0.0001682398362301878}, "score": 4.934382441092093}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9411970626407321, "4": 0.05418462946295192, "3": 0.0037218266361140643, "2": 0.0005944826657226975, "1": 0.0002827393809486258}, "score": 4.935456068678502}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9958538813815951, "4": 0.0038699619655964295, "3": 0.00017082156940678166, "1": 6.394821133964066e-05, "2": 2.699418730870058e-05}, "score": 4.9954515540239575}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9686404486245412, "4": 0.030659834606255564, "3": 0.0006697547214457595, "2": 1.792213530268998e-05, "1": 7.799951829444824e-06}, "score": 4.967915553700839}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998287747907096, "4": 0.00016910360221666923, "3": 8.249335494309895e-07, "1": 1.212363367592587e-07, "2": 0}, "score": 4.999828761384058}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987759986015313, "4": 0.001221155179245388, "3": 1.7674548218204189e-06, "1": 7.14591413668916e-08, "2": 0}, "score": 4.998775022840619}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6048250114870094, "1": 0.3719416469689385, "3": 0.020291767846190967, "4": 0.0014230543025373842, "5": 0.0013151743981219227}, "score": 1.655071613214847}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5817784929509875, "4": 0.25289952589038683, "2": 0.0997204009077924, "3": 0.05135838832796575, "1": 0.014094776658263879}, "score": 4.288737825933483}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984448090646916, "4": 0.0015332789993339937, "3": 1.9402250373272843e-05, "1": 0, "2": 0}, "score": 4.998427912554475}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5749190446557157, "5": 0.2869789531166268, "3": 0.1342792758124971, "2": 0.0037349419600350847, "1": 5.8100226248022815e-05}, "score": 4.145059798693581}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4662980299649356, "5": 0.3966155323088718, "3": 0.10395449746057994, "2": 0.030042143493139987, "1": 0.003059768559587451}, "score": 4.223404150610644}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"4": 0.49807134458483077, "5": 0.4756484252822647, "3": 0.025761344133803182, "2": 0.00048714925665493486, "1": 0}, "score": 4.4489270301166846}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6228420398098916, "4": 0.36076976290544677, "3": 0.015753495528778826, "2": 0.0005742096410581696, "1": 0}, "score": 4.6059767818160635}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9787436162973037, "4": 0.021078493999711706, "3": 0.00016337530812878974, "2": 2.1469195728846492e-06, "1": 0}, "score": 4.978588049813547}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8333959246787838, "4": 0.16160246165460398, "3": 0.004775445552396915, "2": 0.00019127488042377448, "1": 0}, "score": 4.828266830273689}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7091531410035804, "4": 0.2795407502655066, "3": 0.01049267378616206, "2": 0.0005408595092477068, "1": 0}, "score": 4.697768942872407}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9909551192725968, "2": 0.009003553015957752, "3": 3.943806860067727e-05, "5": 5.40319070817441e-07, "4": 0}, "score": 1.0090846026875127}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.35408623281157803, "2": 0.3292448763694835, "1": 0.29222439377644815, "4": 0.017854048317005933, "5": 0.006528406454552189}, "score": 2.1171624240556546}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6557068794520163, "4": 0.3380933967240947, "3": 0.00611982119125455, "2": 5.8799159345919296e-05, "1": 0}, "score": 4.649483166292721}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9665692022669248, "4": 0.033252051983334335, "3": 0.00016044152692476081, "2": 4.539657451359529e-06, "1": 0}, "score": 4.9664129836797795}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7743603385861874, "5": 0.21692248526868924, "3": 0.008366279478947285, "2": 0.00026154113050541004, "1": 0}, "score": 4.208051714101092}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6724485204183515, "3": 0.21275678928604871, "5": 0.08668465504156783, "2": 0.02756654993918838, "1": 0.0005293223258686451}, "score": 3.8172042099647774}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.49970614666360313, "4": 0.3058857539034913, "2": 0.18090046791308773, "5": 0.01238780571892366, "1": 0.001111662095816954}, "score": 3.1475387776996864}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7269672286317935, "5": 0.2237482148909508, "3": 0.04809009731947395, "2": 0.0011428212421154488, "1": 0}, "score": 4.17338142814281}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5864835611565521, "5": 0.39280504456710974, "3": 0.020229814447295196, "2": 0.00043798933377334323, "1": 3.9748398777592666e-05}, "score": 4.371581433907658}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7384638712561742, "5": 0.22399438374687786, "3": 0.03566123266437547, "2": 0.0017506946971821767, "1": 0.00010712019887717949}, "score": 4.184514589099678}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9593916848338923, "3": 0.02405173605010573, "1": 0.015924268701359923, "4": 0.0005856631869064605, "5": 4.282151049369425e-05}, "score": 2.0094272943202025}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5577606507113518, "3": 0.2212115490061517, "2": 0.1440285982739038, "5": 0.07295604080287124, "1": 0.003821665334206047}, "score": 3.552123096361191}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9404707981550668, "4": 0.05898832712437304, "3": 0.0005237926280334062, "2": 7.190426999682006e-06, "1": 0}, "score": 4.939941922264143}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9291541990822192, "4": 0.06871080596884614, "3": 0.0019516228924463554, "2": 0.00013901746294873508, "1": 2.671955135615108e-05}, "score": 4.926860727837841}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5421955224861953, "5": 0.3722530179985915, "3": 0.07209863261420443, "2": 0.01205843335922333, "1": 0.0012700525517970293}, "score": 4.272261214239464}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9811159545942552, "4": 0.016882680584884978, "3": 0.001629478913895839, "2": 0.0002329354922562351, "1": 0.00013548169757702722}, "score": 4.97861755415059}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.41393463669532476, "5": 0.27986646507983404, "4": 0.19896783509700114, "2": 0.1033167259190315, "1": 0.0039054248702829627}, "score": 3.647578961039995}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.99773205947217, "4": 0.0022428262268168004, "3": 2.4153071540768312e-05, "2": 3.250492914879652e-07, "1": 0}, "score": 4.997707891024033}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999425902750013, "4": 5.66542812300384e-05, "3": 6.911928250056184e-07, "1": 2.6281751445072827e-08, "2": 0}, "score": 4.999941858203907}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9619444060068569, "4": 0.035438261825638154, "3": 0.0023682263015349127, "2": 0.0002028467074287744, "1": 3.89993725665976e-05}, "score": 4.959060450746375}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9517261653562631, "4": 0.04382498019876679, "3": 0.004358503563130314, "2": 7.145226168468604e-05, "1": 1.832528056140805e-05}, "score": 4.947170324478328}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8240045230082897, "4": 0.15857275006857627, "3": 0.014748945356601501, "2": 0.0020700709436447316, "1": 0.0006019184421437362}, "score": 4.803311120116688}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6740794679835344, "5": 0.23212046416148047, "3": 0.09188421749548792, "2": 0.0018416096131709323, "1": 7.278075442539739e-05}, "score": 4.136334884224201}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.995724443329193, "4": 0.004218973191883859, "3": 5.3236010580121824e-05, "2": 1.6485441382463646e-06, "1": 1.1607374756289055e-06}, "score": 4.9956649638715795}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5748395790885622, "5": 0.3162280020800119, "3": 0.10284352712122843, "2": 0.005749804642312784, "1": 0.00033768602983338914}, "score": 4.200872089014098}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"2": 0.881280954322679, "1": 0.0814139210765142, "3": 0.03542952737066394, "4": 0.0015851250164999003, "5": 0.0002819569946209}, "score": 1.9580313699389351}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9077271873379096, "4": 0.0899960498653575, "3": 0.002181075227831691, "2": 7.811956658798912e-05, "1": 1.0565094101778e-05}, "score": 4.905364517879214}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8792913588071612, "4": 0.11890906947731826, "3": 0.001766791657617489, "2": 1.9450690251899192e-05, "1": 0}, "score": 4.877497362253995}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9155940494467877, "4": 0.0830663992536463, "3": 0.0012810200555795133, "2": 2.7027086260236855e-05, "1": 0}, "score": 4.914287779085088}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5138173638080019, "5": 0.355315376279576, "3": 0.11830778534230538, "2": 0.011880656566908373, "1": 0.0006220621192717345}, "score": 4.211392089190518}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8627271952341224, "1": 0.0727327655974253, "3": 0.060531959332034806, "4": 0.003371242190543261, "5": 0.0006360165327958414}, "score": 1.9964497247989061}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5225836302794383, "3": 0.23688049630884314, "5": 0.1421567012347708, "2": 0.09569506014357046, "1": 0.0026219908063418473}, "score": 3.7060018486938566}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7607071483154214, "4": 0.23546690645674034, "3": 0.0035568285069924807, "2": 0.00020854056068198728, "1": 0}, "score": 4.7567790814579105}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9643947707240642, "4": 0.03385400400205869, "3": 0.0016206402366552481, "2": 7.048828726736963e-05, "1": 0}, "score": 4.962691008513696}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.48963581446491494, "5": 0.24909844480231275, "3": 0.19391778469019605, "2": 0.06299504540804354, "1": 0.004328325639881478}, "score": 3.9162035322406736}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5804027325134417, "4": 0.3932598223451207, "3": 0.025341834786041118, "2": 0.0009342616684804346, "1": 5.949162569143004e-05}, "score": 4.553014926495942}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4770936863198784, "4": 0.36134496326892757, "3": 0.1168430380503865, "2": 0.03625197196958749, "1": 0.008401979047412146}, "score": 4.262557665752276}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8862487513949822, "4": 0.10802517253379401, "3": 0.00548189738395909, "2": 0.0002024444560810707, "1": 3.0470608338606748e-05}, "score": 4.880280468421039}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981758309225478, "4": 0.0017860996553788894, "3": 3.606776600335533e-05, "2": 1.2131175793651375e-06, "1": 6.794786663147716e-07}, "score": 4.998135407341859}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9960446149243616, "4": 0.0038550912565122894, "3": 9.529826053395739e-05, "2": 3.627459561537619e-06, "1": 1.3111433698613674e-06}, "score": 4.995938185038912}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6577437244777934, "3": 0.22711688094099008, "5": 0.06299005639801462, "2": 0.051132278909272404, "1": 0.000997279984944796}, "score": 3.730611449369653}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6770718173082781, "3": 0.27378567136072834, "2": 0.03937694445781594, "5": 0.00940904329050879, "1": 0.00028835736394831684}, "score": 3.6559809604452096}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.48805051702148944, "3": 0.4088726011879443, "2": 0.09086901545386211, "5": 0.011634121383897387, "1": 0.0004525792373448146}, "score": 3.419595426440782}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.869182825299082, "4": 0.1284869675030458, "3": 0.00216538197764022, "2": 0.00010518740386006256, "1": 0}, "score": 4.866858766077634}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6497747335037273, "5": 0.3442992110848498, "3": 0.005792275844189732, "2": 0.00011833801435615792, "1": 8.761749135024159e-06}, "score": 4.338246233382998}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5872719961209039, "5": 0.38737761977726143, "3": 0.023886080394103046, "2": 0.0013309645154395745, "1": 0}, "score": 4.360877729497247}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7042507058177713, "4": 0.2871896155550196, "3": 0.0067046765736769025, "2": 0.0002422011448446331, "1": 0}, "score": 4.698187664654394}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5561833071212814, "4": 0.39457963340193475, "3": 0.0476931451004912, "2": 0.001398610549252324, "1": 0}, "score": 4.505766430720258}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9921066186448801, "4": 0.00786162461404821, "3": 2.807817426424752e-05, "2": 3.2603209809907575e-07, "1": 0}, "score": 4.992081214393127}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9993172262461523, "5": 0.0006720666774281631, "3": 6.282176883808238e-06, "2": 3.2551607205620785e-07, "1": 0}, "score": 4.000665136195048}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"5": 0.839091936376785, "4": 0.1329090525609406, "3": 0.018429299807847646, "1": 0.004736060533099298, "2": 0.004508462917849616}, "score": 4.797696930446593}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.729123887289264, "4": 0.25452161890952635, "3": 0.015659836955497837, "2": 0.0006096198449925951, "1": 7.958451652915578e-05}, "score": 4.712009939317131}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5546682453995035, "5": 0.22765929222552642, "3": 0.20710395783906016, "2": 0.009950113707375485, "1": 0.0005756363692555775}, "score": 3.998928152037668}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9929174825836576, "4": 0.006916381159293086, "3": 0.0001412466365862486, "1": 1.1601176993990483e-05, "2": 8.33487532401471e-06}, "score": 4.992729680219561}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9944062108286319, "4": 0.0054999185276938525, "3": 7.995280778811322e-05, "2": 3.4153451542164943e-06, "1": 0}, "score": 4.994329870270782}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"2": 0.855603962954915, "3": 0.08018249939129532, "1": 0.06048061974844009, "4": 0.0031141594582285484, "5": 0.000617150895963182}, "score": 2.0277816959076995}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9765974309150592, "4": 0.023057130687623006, "3": 0.000326251826785669, "2": 1.2924807904516938e-05, "1": 4.968577381387881e-06}, "score": 4.976231686188734}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9692992269676373, "4": 0.030055839823300685, "3": 0.00057227804044003, "2": 5.5043652814435716e-05, "1": 1.4665349845591584e-05}, "score": 4.968575719156846}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6556946309619094, "3": 0.16812929205503677, "5": 0.1375163169759651, "2": 0.03804934914792907, "1": 0.000607662213673527}, "score": 3.891465041659926}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8046352820542491, "4": 0.19282498788327734, "3": 0.0024301021147056217, "2": 9.168039468305191e-05, "1": 1.1507563996320036e-05}, "score": 4.8019924612808875}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8213473889283346, "5": 0.1452687214984973, "3": 0.03175805134886039, "2": 0.001571392672928602, "1": 0}, "score": 4.110373894171306}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9337119472275554, "4": 0.06489155415676172, "3": 0.0013743711471584576, "2": 2.034494662517859e-05, "1": 1.0607970483438208e-06}, "score": 4.9322943766560225}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9549401076219832, "4": 0.04456519971401427, "3": 0.0004920189135677375, "2": 1.9998507603770493e-06, "1": 0}, "score": 4.954444732206889}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.996553185948925, "4": 0.003420758393519468, "3": 2.3746913353330013e-05, "2": 5.067079676488293e-07, "1": 0}, "score": 4.996530221403203}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9866247690839686, "4": 0.013294567311788828, "3": 7.396666790145404e-05, "2": 1.4094077179709193e-06, "1": 0}, "score": 4.986553200028914}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6036299465994348, "4": 0.34454402596098843, "3": 0.04465631269080971, "2": 0.006611022151056642, "1": 0.0005295248303848095}, "score": 4.544178887598534}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9955632588451857, "4": 0.004422055260075593, "3": 1.383773883633587e-05, "2": 1.679927522235942e-07, "1": 0}, "score": 4.995549762257108}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9959552116814037, "4": 0.004031269259021151, "3": 1.2548568031151163e-05, "2": 1.644918190823255e-07, "1": 0}, "score": 4.995943136859628}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6300731406911865, "5": 0.3398302672470429, "3": 0.029820834066494366, "2": 0.0002663551471572805, "1": 7.462015544595716e-06}, "score": 4.309454937439823}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8655737475204239, "4": 0.13295161685375023, "3": 0.0014589022640488607, "2": 1.3716596979446324e-05, "1": 1.6558998183444227e-06}, "score": 4.864082756180167}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8273794186436051, "1": 0.15770857674979408, "3": 0.014122185195540395, "4": 0.00042161414944420203, "5": 0}, "score": 1.8572042586013153}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6538722715758317, "4": 0.2506929739346022, "3": 0.06338015367889949, "2": 0.025058098757751224, "1": 0.006820216928054457}, "score": 4.5200069390854525}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9439011587807151, "4": 0.054885603290610846, "3": 0.0009790155813336457, "2": 4.70878289047989e-05, "1": 0}, "score": 4.943004436222627}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992068903778301, "4": 0.000774609907881819, "3": 1.0927347127627543e-05, "1": 1.8013521150952714e-06, "2": 0}, "score": 4.999196325351384}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9151497736982273, "4": 0.07608459999253785, "3": 0.008112736863730352, "2": 0.000562808573042385, "1": 6.641902642381641e-05}, "score": 4.905733593937992}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"3": 0.47521524035207996, "4": 0.3627998406369263, "2": 0.14283579431750706, "5": 0.017774294405035095, "1": 0.0013704830637691224}, "score": 3.2527727678619667}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9321235021864852, "4": 0.0666371865934632, "3": 0.0010901539000515426, "2": 6.885463601864095e-05, "1": 0}, "score": 4.930970398436099}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9599078890786973, "4": 0.03929141624975288, "3": 0.0007494662286068735, "2": 1.7778512371917387e-05, "1": 0}, "score": 4.959154949491813}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.983298961828501, "4": 0.016397375294147906, "3": 0.0002672981114838974, "2": 1.5035838097168247e-05, "1": 0}, "score": 4.983022558857979}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9479915341391065, "4": 0.05104438656331136, "3": 0.0009139451493161601, "2": 3.8761812884095435e-05, "1": 6.013076761887814e-06}, "score": 4.946987101282523}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8830838345674263, "1": 0.11338216218696485, "3": 0.003487645891574786, "4": 1.896041828377895e-05, "5": 0}, "score": 1.8901403947246302}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5404163056790423, "3": 0.30273119876400706, "4": 0.14056976013696332, "5": 0.008946664479625327, "1": 0.007277848472104829}, "score": 2.6034679994011443}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9907991017083639, "4": 0.009096584186927152, "3": 9.786995013784576e-05, "2": 3.832188530820508e-06, "1": 0}, "score": 4.990696155045877}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989585639713053, "4": 0.0010341449799574278, "3": 5.085948585704541e-06, "2": 4.515747132173574e-07, "1": 0}, "score": 4.998954326565117}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.4444407627780619, "2": 0.2364890907549783, "3": 0.1994448543821745, "5": 0.09012793662469659, "1": 0.029363907348903668}, "score": 3.3295237048906783}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5936065813562386, "5": 0.33556721495448083, "3": 0.05584876871470072, "2": 0.01376003366356386, "1": 0.001119348230634089}, "score": 4.248864736174731}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7073219089145103, "5": 0.20879225846041635, "3": 0.07832667164125766, "2": 0.005225136275687951, "1": 0.0003035036260772043}, "score": 4.119108438707983}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8947362427304015, "4": 0.10440069985125341, "3": 0.0008526685975270589, "2": 5.756436142536585e-06, "1": 0}, "score": 4.893876202039009}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6375334581208079, "5": 0.2573559841991109, "3": 0.09001759749884407, "2": 0.013196978197880438, "1": 0.0017369970327256793}, "score": 4.135755022211834}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7988339476767925, "4": 0.19246279820665174, "3": 0.008265492176469968, "2": 0.0003091648277954225, "1": 0.00010590691606312259}, "score": 4.789650322417309}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5323834918422725, "5": 0.4370422223080188, "3": 0.029200752485166327, "2": 0.001249359323827415, "1": 0}, "score": 4.4053930904733205}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7849642136075226, "4": 0.20300424273222728, "3": 0.010697138534087216, "2": 0.0010446169664913682, "1": 0.0002663508855090192}, "score": 4.771396867923808}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9919922313781054, "4": 0.007954349444367936, "3": 4.578001114467781e-05, "2": 1.0460232134259132e-06, "1": 0}, "score": 4.991950899394831}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9865944791819005, "4": 0.013269683257346775, "3": 0.0001243493021143012, "2": 4.639759615836147e-06, "1": 0}, "score": 4.986467606182992}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7173644564968777, "4": 0.26856924568905616, "3": 0.012377115941153002, "2": 0.0013921958919436606, "1": 0}, "score": 4.70241155515659}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9571112697085514, "3": 0.027234868404787838, "1": 0.015313844353754491, "4": 0.00023916269629345666, "5": 0.00010018621035417466}, "score": 2.0126999165661807}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8147826324212043, "4": 0.17909669920227791, "3": 0.005640556771463008, "2": 0.0003659208151571608, "1": 5.79258971288321e-05}, "score": 4.8082819342243965}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.650143520302438, "4": 0.33086024940344294, "3": 0.017157532310716733, "2": 0.0015689228153063744, "1": 0.00018085264035081538}, "score": 4.629361548859847}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5213059361853687, "4": 0.2589141343127689, "3": 0.14894045258461164, "2": 0.047733061880543215, "1": 0.022862158557174245}, "score": 4.2083637783711145}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9622213636912544, "4": 0.036806894529875976, "3": 0.000903182428531278, "2": 4.3469457191915565e-05, "1": 1.5794480727538944e-05}, "score": 4.961192793589587}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5533151047860702, "2": 0.26517478616047435, "4": 0.17729155467556446, "1": 0.002328469719316072, "5": 0.0018874699452768495}, "score": 2.911234536870775}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5386539319664795, "3": 0.21722115433843942, "5": 0.1609626545855997, "2": 0.07991577591140962, "1": 0.003163826709544455}, "score": 3.774399820977099}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.6725353996545477, "4": 0.23690624661829593, "2": 0.07633636871967785, "5": 0.013466130470807993, "1": 0.0007422273203933179}, "score": 3.186020219137206}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9548853290539108, "4": 0.043290645784614584, "3": 0.0016009389149584205, "2": 0.00013205659199768286, "1": 7.347171909557036e-05}, "score": 4.952816591289851}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8423123934076838, "4": 0.1549937477458504, "3": 0.0025198094384016566, "2": 0.00013823740842636734, "1": 2.1383039433640684e-05}, "score": 4.839464072627824}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8424375029347563, "3": 0.12310360020960709, "1": 0.03060336832810092, "4": 0.00316498171706949, "5": 0.0006659263360984596}, "score": 2.1008304568176177}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9046369780342407, "4": 0.09235914978354934, "3": 0.0027174943991537825, "2": 0.0002245610387968976, "1": 5.212340384462568e-05}, "score": 4.901322728173986}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5485728452346582, "5": 0.3967723295499696, "3": 0.05246100223392084, "2": 0.0019772025239596326, "1": 0}, "score": 4.340430666514854}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999254260847726, "4": 7.408073840544005e-05, "3": 2.499404868557943e-07, "1": 1.5608503110536898e-08, "2": 0}, "score": 4.9999253569296185}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9988227271300747, "4": 0.0011718459950528983, "3": 4.602200496715186e-06, "2": 9.265508516206988e-08, "1": 0}, "score": 4.998818670773943}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4868246608751432, "2": 0.2971962749597166, "4": 0.17876447887305125, "1": 0.019218312086077854, "5": 0.017913398976199056}, "score": 2.878948345630954}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9253571295330969, "3": 0.0484406471771218, "1": 0.023337805025785745, "4": 0.00270991231690387, "5": 0.00013656552798941204}, "score": 2.030932918318631}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987327137862458, "4": 0.0012470874330834751, "3": 8.356666118988982e-06, "1": 4.1236168355312526e-07, "2": 0}, "score": 4.9987345353239965}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9931172052816192, "4": 0.006815759327575274, "3": 4.999167831938696e-05, "2": 2.530562368211179e-06, "1": 0}, "score": 4.993076565147832}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9617403751905163, "4": 0.03564547744703273, "3": 0.0019348269268288547, "2": 0.000323003467340153, "1": 0.0002820980083687093}, "score": 4.9583843775956025}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.49453934790152315, "5": 0.4572293289771831, "3": 0.038780706933564134, "2": 0.008309448816933981, "1": 0.0011228835545602207}, "score": 4.3984683592683265}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5280267466630864, "5": 0.4101732695086279, "3": 0.05275200488761873, "2": 0.008495403724768967, "1": 0.0005431831511315016}, "score": 4.33880408978803}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6362025891274732, "5": 0.3492251974408781, "3": 0.014475162924613457, "2": 8.390393873525469e-05, "1": 0}, "score": 4.3345866253047145}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6084377089469761, "3": 0.1811742325419325, "5": 0.1561384758140387, "2": 0.05151287513173074, "1": 0.002705826143011244}, "score": 3.8638168090489793}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9350746867561643, "4": 0.06296966981650481, "3": 0.0018219990528232897, "2": 0.00010147947466306426, "1": 2.7834800599926463e-05}, "score": 4.932970264206051}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6584719207091962, "3": 0.2721823861716832, "5": 0.04858850493612183, "2": 0.020569036838826302, "1": 0.00017278353322013978}, "score": 3.7347456181079304}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6917470326168362, "3": 0.19846990548423618, "5": 0.10241405704173463, "2": 0.007321488680742504, "1": 4.6735804284945385e-05}, "score": 3.8891608802873954}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.560541330815167, "4": 0.4199397837530587, "3": 0.01904992717978877, "2": 0.0004274644632257525, "1": 2.3906838744973223e-05}, "score": 4.540574261245204}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7740262199978292, "4": 0.22452570039001826, "3": 0.0013975876999783765, "2": 3.658277707616641e-05, "1": 0}, "score": 4.77256621247152}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.936781176784387, "4": 0.06249285804807724, "3": 0.0006932485257835265, "2": 2.6446069813026898e-05, "1": 3.1349353691281075e-06}, "score": 4.9360285663582735}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6338351652930122, "1": 0.3515310626300401, "3": 0.013978637606016146, "5": 0.0003241925268425806, "4": 0.0003175373845337877}, "score": 1.6640507240734947}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9565208663725001, "4": 0.04158619573820374, "3": 0.0017044189808810568, "2": 0.000166747477619932, "1": 1.9605214131292084e-05}, "score": 4.954426204287933}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8006635320710638, "4": 0.17981347776376186, "3": 0.01848805187758673, "2": 0.0009254883627905566, "1": 8.670135896186369e-05}, "score": 4.780082145141045}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9210452431426348, "4": 0.07764500954730624, "3": 0.0012267887450500491, "2": 6.89962777827255e-05, "1": 1.0610674874102811e-05}, "score": 4.919651712133435}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7741651469497692, "5": 0.1716858715735285, "3": 0.05115141107326051, "2": 0.0029317229243088017, "1": 6.321215179857998e-05}, "score": 4.114481679892955}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6874196424375815, "5": 0.24558199393345326, "3": 0.06366472738429942, "2": 0.0031554681830645143, "1": 9.922753615347179e-05}, "score": 4.175322487623861}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9190565079469313, "4": 0.07827529053930994, "3": 0.0022219813080917813, "2": 0.00013291788851317092, "1": 0}, "score": 4.916855943953549}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7276340032437717, "5": 0.23877671752939758, "3": 0.03219316873583561, "2": 0.0007187377568109147, "1": 0}, "score": 4.205285127828265}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9861391515543091, "4": 0.012645485562909812, "3": 0.0011321098084212755, "2": 4.7836242235310865e-05, "1": 3.2522090234389674e-05}, "score": 4.984816653780736}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99277658468281, "4": 0.007083727689625985, "3": 0.00010804248808611533, "2": 2.998959988200924e-06, "1": 0}, "score": 4.99269098107877}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9148110571021184, "1": 0.04513119890083826, "3": 0.03679835632081559, "4": 0.0028035354431939765, "5": 0.0004373935045364604}, "score": 1.9985863827263972}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7851215126454809, "4": 0.2100039371724878, "3": 0.004698590541630587, "2": 0.00010958281425369918, "1": 0}, "score": 4.78025554736216}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9690607282524106, "4": 0.030557574081029902, "3": 0.00035535243013728784, "2": 7.239025210970919e-06, "1": 0}, "score": 4.968709406138368}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.779048668073979, "4": 0.21954722972995955, "3": 0.0013556964113027158, "2": 2.37063645372417e-05, "1": 0}, "score": 4.777664766802469}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9535203449909251, "4": 0.04529082978444211, "3": 0.0011132362111064577, "2": 4.504241304358085e-05, "1": 0}, "score": 4.952346114890025}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6487301255251313, "4": 0.34911028633805935, "3": 0.0021225140929772308, "2": 2.7761899468742883e-05, "1": 0}, "score": 4.646558108475662}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6196390548910773, "4": 0.3719194278386406, "3": 0.008258375347167595, "2": 0.00017001328107414015, "1": 8.977303492272224e-06}, "score": 4.611016257606629}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6978859744160446, "4": 0.298702973202931, "3": 0.003365963590893632, "2": 3.090838659637265e-05, "1": 0}, "score": 4.694468041889034}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.763133160991801, "5": 0.2173079732569777, "3": 0.018459677874101743, "2": 0.001005942164011007, "1": 6.76526521584432e-05}, "score": 4.196638485679127}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7657724622803745, "4": 0.2288005078167854, "3": 0.0053052679459568985, "2": 0.00011104533684453629, "1": 0}, "score": 4.760253251005953}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7908982216291552, "1": 0.1923389882361362, "3": 0.016034205418684166, "4": 0.0005989702662874453, "5": 0.00010781303375282609}, "score": 1.8252127862076248}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.799856781872543, "4": 0.0751308063446453, "2": 0.05587199546123828, "1": 0.037125823510658996, "3": 0.031851668887024204}, "score": 4.544972440579497}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.951185174337153, "4": 0.04768802313176204, "3": 0.0009987732320778828, "2": 0.00011050641327531649, "1": 9.96206677862974e-06}, "score": 4.949942684422841}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992853203052766, "4": 0.0007121442989655865, "3": 1.8017205292718718e-06, "2": 1.4571830452940104e-07, "1": 0}, "score": 4.9992838146839755}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.48961620983939097, "5": 0.420476549187758, "3": 0.07034753043626608, "2": 0.01827831307068017, "1": 0.0011516333959931797}, "score": 4.3101577397527775}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.505020503268133, "5": 0.29598553325232724, "3": 0.1575674592055246, "2": 0.03866441929167667, "1": 0.0026919969505032003}, "score": 4.053016960466353}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5756219330623785, "5": 0.2444538843309674, "3": 0.15207377713568077, "2": 0.026768276641687426, "1": 0.0009931166783160297}, "score": 4.035867396511077}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8208765797516525, "5": 0.12476608684485761, "3": 0.05227798151998812, "2": 0.0019556542241809726, "1": 0}, "score": 4.0685852807151965}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7719354395347497, "4": 0.21304501448299898, "3": 0.013403017644870492, "2": 0.0013960204859504825, "1": 0.00014864784585713134}, "score": 4.755348716743402}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7495079008505369, "3": 0.14458657729765992, "5": 0.10004662016322632, "2": 0.0057748418975306975, "1": 6.95771047140119e-05}, "score": 3.9437008123928883}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7504097187110425, "3": 0.16228902961489503, "1": 0.04575757166866282, "4": 0.03858225975482366, "5": 0.002933832471215847}, "score": 2.202503061479307}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9492158236950592, "4": 0.05047508655375805, "3": 0.00029470933277239345, "2": 6.682676346373816e-06, "1": 0}, "score": 4.948915053512917}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5631130678565434, "5": 0.4240227582808317, "3": 0.012670488876935474, "2": 0.00017089931090571162, "1": 0}, "score": 4.411019836146401}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9832935409162671, "4": 0.01667098159549695, "3": 3.3372011110356455e-05, "2": 3.124207499787154e-07, "1": 0}, "score": 4.983261307106613}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995479799918402, "4": 0.0004482672335172493, "3": 2.3254104427249062e-06, "1": 1.3912347343854177e-07, "2": 0}, "score": 4.999546524867519}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6101111837384272, "3": 0.1523023483441441, "2": 0.12875412514376333, "5": 0.10122579128538729, "1": 0.007578611314526979}, "score": 3.6686701012951963}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9490631014610231, "4": 0.050417512198529586, "3": 0.0004762569683139802, "2": 2.657156231390626e-05, "1": 0}, "score": 4.948549407268772}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9896660529611835, "4": 0.010212416449796079, "3": 0.00010699873992217303, "2": 1.8758249912089726e-06, "1": 0}, "score": 4.989567826565547}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978070709898331, "4": 0.0021779946736451535, "3": 1.3391130140407656e-05, "2": 5.479389288023767e-07, "1": 0}, "score": 4.997793577053307}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986676710393575, "4": 0.0013217165110445477, "3": 6.7796844391049496e-06, "2": 4.0319158134819705e-07, "1": 0}, "score": 4.998663509961744}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8245209153423361, "1": 0.15811080409576045, "3": 0.0172910370729723, "4": 5.8844275601009754e-05, "5": 0}, "score": 1.8592953326732233}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9681129254373265, "4": 0.03139849239872621, "3": 0.00046463263354799063, "2": 1.001538647475438e-05, "1": 0}, "score": 4.967641745290175}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9180938816481893, "4": 0.08106597091970652, "3": 0.0008192548912527992, "2": 7.954760527672872e-06, "1": 0}, "score": 4.917270584681204}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5899197312893201, "5": 0.40213840844749293, "3": 0.007832919325192029, "2": 9.040608327185044e-05, "1": 0}, "score": 4.394131982134788}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9935144177669438, "4": 0.006439389767209866, "3": 4.171828650432734e-05, "2": 1.5527717472032812e-06, "1": 0}, "score": 4.993472496275042}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"1": 0.8852867058729695, "2": 0.11113086590439407, "3": 0.0033375031881676532, "4": 0.00015257016032661533, "5": 8.888030331532967e-05}, "score": 1.1186195161268808}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.655460851941785, "4": 0.31125200171843886, "3": 0.02782704192407534, "2": 0.005130293032940136, "1": 0.00026626406927215886}, "score": 4.616613615882764}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7851475948153535, "4": 0.21128858046488547, "3": 0.0033546870218130608, "2": 0.00014614840206412147, "1": 0}, "score": 4.781549840263549}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8173770950171171, "4": 0.16319130762048323, "3": 0.01580508903478734, "2": 0.003073596207026206, "1": 0.0005070111816904594}, "score": 4.793940222624852}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5703385198302587, "4": 0.27106801818025994, "3": 0.11102350981068672, "2": 0.038654437427329706, "1": 0.00868749537904376}, "score": 4.35602482958599}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.26826244641042285, "4": 0.26803894281940066, "5": 0.2561223804752553, "2": 0.18067542310757587, "1": 0.026602342584119476}, "score": 3.546566726315203}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6365431695206293, "5": 0.24886437739497774, "3": 0.10407625784775786, "2": 0.010164686230624833, "1": 0.0002811399415399385}, "score": 4.123624026568445}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6197173016545439, "5": 0.3074852685615677, "3": 0.06772552087572155, "2": 0.004664858861080514, "1": 0.0002014200559432597}, "score": 4.229873038586744}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3655118423159303, "4": 0.35566023497276855, "2": 0.22643994787661523, "5": 0.042701842918289476, "1": 0.009552290598534545}, "score": 3.195545563811626}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5544402127037306, "5": 0.24990625785954512, "3": 0.12525611723627833, "2": 0.06479117326165135, "1": 0.0052775906589497676}, "score": 3.9792281955052995}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5721009312123068, "3": 0.24423214306125626, "5": 0.10582985669320742, "2": 0.0767261262143625, "1": 0.0010645370171735301}, "score": 3.704938157570358}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.9376257563752073, "3": 0.04814858637228646, "1": 0.013431521281398047, "4": 0.0007319725095263879, "5": 5.5768631842760166e-05}, "score": 2.036348548448248}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9995159401947685, "4": 0.00048010967047677793, "3": 9.768653639284993e-07, "1": 0, "2": 0}, "score": 4.999517935165486}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984638228299204, "4": 0.0015140839142112645, "3": 1.245656829843993e-05, "2": 7.097216400874785e-07, "1": 0}, "score": 4.998458860026568}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989530898931649, "4": 0.0010342631894841826, "3": 1.136656962237871e-05, "2": 4.571793830426392e-07, "1": 0}, "score": 4.998941631261906}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9257609139055081, "1": 0.04152602250271111, "3": 0.03224354857299797, "4": 0.00022367778533712756, "5": 0}, "score": 1.9911627091058166}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.649760282674348, "4": 0.3411994074605205, "3": 0.008888873081298277, "2": 8.908843766301322e-05, "1": 0}, "score": 4.640733181371918}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9739776180679379, "4": 0.02590754603523055, "3": 0.0001004087703939917, "2": 1.2198325045462042e-06, "1": 0}, "score": 4.973887632052748}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9657678775845414, "4": 0.03387150427300747, "3": 0.00033103250003180935, "2": 8.906956119902104e-06, "1": 0}, "score": 4.965438995182391}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9638816939703085, "4": 0.034345828800058036, "3": 0.0016965128488985487, "2": 5.9636008313146906e-05, "1": 1.2428877030579293e-05}, "score": 4.962032373914499}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"1": 0.9821229989087501, "2": 0.017777796285956833, "3": 7.925167577536274e-05, "5": 2.0499339189336874e-06, "4": 0}, "score": 1.0179448206428172}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.7827737950032858, "2": 0.2169476063469657, "3": 0.0002512867099525567, "5": 1.8650065365911972e-06, "4": 0}, "score": 1.217463173563881}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5032620350970263, "5": 0.40560520254498006, "3": 0.06965435874675889, "2": 0.016047390954050927, "1": 0.005220718201800143}, "score": 4.288254525613194}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7078859753671183, "4": 0.2558859094633607, "3": 0.030980252301943356, "2": 0.0038592168681040114, "1": 0.0012652586642972932}, "score": 4.665473624353213}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.5181513644730891, "1": 0.3175895351282798, "3": 0.1255007806639205, "4": 0.023697858347704034, "5": 0.014755086620768902}, "score": 1.8995415446160262}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4860605180973083, "4": 0.4718344011397526, "2": 0.033291971738376204, "5": 0.008678899882410995, "1": 0.00013103802627197514}, "score": 3.4556395979996184}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"1": 0.6683571450770796, "2": 0.3010321528013695, "3": 0.026505397168271137, "5": 0.0031268411540182985, "4": 0.0009645093804046492}, "score": 1.369448995341226}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.613063377083154, "4": 0.3692549840115977, "3": 0.016915877517978403, "2": 0.0007168315372441432, "1": 4.078027701205744e-05}, "score": 4.59459634136595}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"3": 0.3819064674360416, "4": 0.36005740568798933, "5": 0.15107567632418067, "2": 0.09429744349967333, "1": 0.012640617988036373}, "score": 3.542642228112221}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.41366641120509173, "3": 0.3025276502207671, "4": 0.266390686902949, "2": 0.015351218914359371, "1": 0.0020554065829907846}, "score": 4.074270744078984}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9434305837614374, "3": 0.043922555418154124, "1": 0.011790297871426155, "4": 0.0007973099969735016, "5": 5.2319782915108474e-05}, "score": 2.0338840718134197}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.5462788277782905, "3": 0.32089708972820086, "4": 0.0804310325722893, "1": 0.036770808348392726, "5": 0.015429552731009663}, "score": 2.4913716865585998}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5116668240701698, "4": 0.4653903561341502, "3": 0.02216713483135418, "2": 0.0007191328836529678, "1": 0}, "score": 4.488089025921479}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6789920363432177, "4": 0.2937693921126708, "3": 0.02485499849466942, "2": 0.0021961202460073614, "1": 0.00017876311651095594}, "score": 4.649214149474706}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7940167676586379, "4": 0.19629991710247288, "3": 0.00895959996280837, "2": 0.0006323732833269113, "1": 6.2491375671457e-05}, "score": 4.783627555140691}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8219801439469598, "3": 0.14006075307029697, "5": 0.02265254661590416, "2": 0.015138653068847182, "1": 0.0001204641330955078}, "score": 3.8519460714538956}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9381354700910576, "4": 0.061324993182965214, "3": 0.0004841772496519693, "2": 4.114159106840762e-05, "1": 0}, "score": 4.937582340097399}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9824676146208018, "4": 0.017400853887003895, "3": 0.00012107008078333379, "2": 1.5152638132562394e-06, "1": 0}, "score": 4.9823523022810825}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.941782653308186, "4": 0.05787274098465972, "3": 0.00033496148597073023, "2": 5.976998733606265e-06, "1": 0}, "score": 4.941439190291682}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8930272227212628, "4": 0.10627188669155761, "3": 0.0006782544808227151, "2": 1.5873888998198314e-05, "1": 0}, "score": 4.892323254546244}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7942952622871146, "4": 0.20227241520259268, "3": 0.0031518471537274806, "2": 0.00022174954248023633, "1": 3.6895388043503896e-05}, "score": 4.790606489160785}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.845429480330122, "4": 0.1530658129618919, "3": 0.001457092889288431, "2": 3.5731210764755435e-05, "1": 0}, "score": 4.843910952882287}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9952775137696805, "4": 0.004689093494315492, "3": 3.242265989962143e-05, "2": 5.412059211120505e-07, "1": 0}, "score": 4.995244435528602}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9610141844760639, "4": 0.03852167149811581, "3": 0.0004325059389544628, "2": 1.7806909532569345e-05, "1": 0}, "score": 4.960559350384758}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9855573256294413, "4": 0.014350241609776828, "3": 8.471321052924657e-05, "2": 2.7128630628479612e-06, "1": 0}, "score": 4.985472120643428}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4000197732383721, "3": 0.37036660854143166, "5": 0.17754629272244918, "2": 0.05072022666073906, "1": 0.0013140088812505235}, "score": 3.7017873363719422}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9981406846723203, "4": 0.0018200474623849044, "3": 2.9897012468535426e-05, "2": 2.4120838886463752e-06, "1": 0}, "score": 4.9981129091291825}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9737867712442728, "4": 0.025774779600956463, "3": 0.00041263505488223435, "2": 1.650490415011705e-05, "1": 0}, "score": 4.973350187488506}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996929481000866, "4": 0.0002998080864033278, "3": 4.054148013976297e-06, "1": 2.54429004647538e-07, "2": 0}, "score": 4.999691064994752}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995310681829088, "4": 0.00046307130928634487, "3": 3.872562985390205e-06, "1": 2.3074976084239007e-07, "2": 0}, "score": 4.99952825973676}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9430261878024253, "1": 0.03844448601293122, "3": 0.018114879619614752, "4": 0.000356361568740025, "5": 5.309605108478261e-05}, "score": 1.9805423078240578}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9920346935223456, "4": 0.007676568051440268, "3": 0.00021503344151538057, "2": 2.1864024254590584e-05, "1": 0}, "score": 4.991827349314704}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6615894510524891, "4": 0.33358812688607337, "3": 0.004748414054263396, "2": 5.2565633881818016e-05, "1": 0}, "score": 4.6567499880088645}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8963038277638228, "4": 0.10041031881137255, "3": 0.0030795262769841934, "2": 0.0001507826744358271, "1": 0}, "score": 4.892972335816107}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"2": 0.4488898249862171, "3": 0.18444375738422347, "4": 0.1599076848415043, "5": 0.13415230768297254, "1": 0.07241904222609843}, "score": 2.834453370164931}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9263985521893109, "1": 0.040795675330155254, "3": 0.03233519220251382, "4": 0.0002243794423821649, "5": 0}, "score": 1.9919863027781703}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7488219055798929, "4": 0.2248122431577768, "3": 0.023086438771824057, "2": 0.002572305758517392, "1": 0}, "score": 4.721100750486144}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7244705983735081, "5": 0.2175371366086618, "3": 0.05702300477644218, "2": 0.000906688506120082, "1": 0}, "score": 4.158710685622983}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9917909636790666, "4": 0.008127970642903793, "3": 6.200199475307762e-05, "2": 3.230909116873127e-06, "1": 0}, "score": 4.991738201833054}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9643605015647674, "4": 0.03467523276647082, "3": 0.0009052473832143755, "2": 3.800605761581354e-05, "1": 0}, "score": 4.963399485235894}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.42708983562558805, "2": 0.2935740123363874, "4": 0.26935806172724686, "5": 0.007833530316727757, "1": 0.002115233649518422}, "score": 2.987220267942453}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9424243388166162, "4": 0.05642311861188291, "3": 0.0011012283944731092, "2": 3.486681641937602e-05, "1": 8.458311420107464e-06}, "score": 4.941235521431922}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6003935872956336, "4": 0.3825093314750201, "3": 0.016687939601626747, "2": 0.0003808837300058168, "1": 2.4339062207721577e-05}, "score": 4.582873147231357}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9909409526794748, "4": 0.00893417918256729, "3": 0.00011085938073473374, "1": 4.733569447474678e-06, "2": 4.51983983266086e-06}, "score": 4.990811564564467}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970013659111735, "4": 0.002978832004779773, "3": 1.6493503200830945e-05, "2": 7.197038708683902e-07, "1": 0}, "score": 4.996986014074367}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5225005199625655, "4": 0.43325656395464024, "3": 0.027399399003705558, "2": 0.009737781104116477, "1": 0.006838824628856331}, "score": 4.4552305910739145}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.950326347209287, "4": 0.03803306751101258, "3": 0.008944879798089545, "2": 0.00204197255415184, "1": 0.000619959936848041}, "score": 4.935469236086078}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.999482009803268, "4": 0.0005106510896977083, "3": 3.7458462446236914e-06, "1": 0, "2": 0}, "score": 4.999481855355984}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994353328845156, "4": 0.0005583562826300116, "3": 4.80435384562923e-06, "1": 1.6583724190785947e-07, "2": 0}, "score": 4.999431370898383}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9693261069772033, "4": 0.02844682852554252, "3": 0.0020879288191254447, "2": 9.910694880147816e-05, "1": 2.5123296371334802e-05}, "score": 4.966979007612129}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7188248163318585, "1": 0.27697207227212023, "3": 0.00408089643597521, "4": 4.916134077206171e-05, "5": 0}, "score": 1.7271872168842082}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5146343399583353, "3": 0.4492874749962572, "2": 0.023858422006956054, "5": 0.01210925188447051, "1": 7.269681387780189e-05}, "score": 3.5148684975050375}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5633268323538402, "3": 0.4072408335165302, "2": 0.02148919560841761, "5": 0.007880065996161676, "1": 5.1645783590000176e-05}, "score": 3.557500847588616}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9168327881245574, "3": 0.06748831548593083, "5": 0.014376411583596331, "2": 0.0012904116538528098, "1": 1.0083975280501956e-05}, "score": 3.9442769100210415}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.49125118676252816, "4": 0.2665832503781097, "2": 0.2389541228688247, "5": 0.0024774157460183983, "1": 0.0007276389358784009}, "score": 3.031128879897071}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"2": 0.4469867173101027, "1": 0.21371727121750003, "5": 0.14859123979761785, "3": 0.11366253954661251, "4": 0.07646268767081903}, "score": 2.498933517218093}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9832331498648755, "4": 0.016499833319089337, "3": 0.0001820156291725569, "2": 5.693263068195293e-06, "1": 0}, "score": 4.983117716734526}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9914615652695625, "4": 0.008473330807339316, "3": 5.150081114655894e-05, "2": 1.7170926793772344e-06, "1": 0}, "score": 4.991418414291436}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957680560191755, "4": 0.0041477925579617, "3": 4.76875118703548e-05, "1": 2.8575898448627107e-06, "2": 0}, "score": 4.995745259072728}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9769072381946884, "4": 0.022920295375051174, "3": 0.00015062759886389765, "2": 4.451911515380283e-06, "1": 0}, "score": 4.976764689702197}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"2": 0.3128523265294903, "3": 0.28683710578975447, "5": 0.19303962505208536, "1": 0.1330397264830079, "4": 0.07354414064720124}, "score": 2.8806095810242365}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7774342845344427, "4": 0.1972237515698953, "3": 0.02300243267886021, "2": 0.0020070839127541967, "1": 0.0003033974183955055}, "score": 4.749529265514345}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9557573673370616, "4": 0.042477999326132505, "3": 0.001651041959120059, "2": 6.898692942045173e-05, "1": 0}, "score": 4.954010904649142}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9956143047727543, "4": 0.004312758743205623, "3": 6.318339681176728e-05, "2": 4.010033349888326e-06, "1": 0}, "score": 4.995548818799747}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7289422487013126, "4": 0.25376417198462226, "3": 0.01576426514718266, "2": 0.0012680423810305323, "1": 0.00021983550408280798}, "score": 4.710011812529345}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"3": 0.4759882071274276, "2": 0.23692960672584681, "4": 0.21524475564278026, "5": 0.061668069141216406, "1": 0.010051860874254357}, "score": 3.0815571484556394}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9851368425625435, "4": 0.0147368885997687, "3": 0.00011356036638597629, "2": 2.4208447704769348e-06, "1": 0}, "score": 4.985028574112709}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9969961515079656, "4": 0.002973400594040848, "3": 2.7105415936246036e-05, "2": 4.3795617003078887e-07, "1": 0}, "score": 4.996971065907959}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992170036517487, "4": 0.0007697648341180865, "3": 1.0913172632293455e-05, "1": 6.331145294295372e-07, "2": 0}, "score": 4.999205875024219}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999043260567298, "4": 0.0009242749182522559, "3": 2.9199061196841075e-05, "1": 1.1558575753718993e-06, "2": 0}, "score": 4.999012701446253}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5244276245949406, "5": 0.3945953103621906, "3": 0.07354312574506315, "2": 0.007069265458611172, "1": 0.0003247769236748085}, "score": 4.305951529451204}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.49549604850834894, "3": 0.2505688615066832, "1": 0.11232153190975135, "5": 0.07140994025992706, "4": 0.0700845996663102}, "score": 2.4927049905453007}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.835625201490879, "4": 0.16088973892709685, "3": 0.0033747794666750407, "2": 6.778931305496622e-05, "1": 0}, "score": 4.832150202127812}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7637759286041896, "4": 0.2259375828352669, "3": 0.009543649686145484, "2": 0.0005964781186496354, "1": 7.504947464319326e-05}, "score": 4.752867862228574}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9581419200199214, "4": 0.0405298070104575, "3": 0.0012276021301563151, "2": 6.47975347053686e-05, "1": 2.006073772870058e-05}, "score": 4.956739669117317}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9738699751404278, "4": 0.022163663729833936, "3": 0.0032416964192923, "2": 0.0004413050051156384, "1": 0.0002572335836649164}, "score": 4.9689992841531}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995459544199067, "4": 0.000437018644071317, "3": 1.1164393451860815e-05, "1": 1.2950179524669765e-06, "2": 0}, "score": 4.999535470375465}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9815152195177059, "4": 0.01781076908233591, "3": 0.000643291238022462, "2": 1.0444803248925873e-05, "1": 0}, "score": 4.980870926183039}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999156521574794, "4": 8.250348690513601e-05, "3": 1.219188602988775e-06, "1": 1.2553967410574198e-07, "2": 0}, "score": 4.999914555934502}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997595390553684, "4": 0.0002371587049024466, "3": 2.6648734164296924e-06, "1": 1.8105771302731766e-07, "2": 0}, "score": 4.999756787206432}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.3952610682982541, "3": 0.26017947438716477, "2": 0.17395674545676387, "5": 0.15835468817910103, "1": 0.01110415074024038}, "score": 3.5163960892312174}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6892953190419969, "5": 0.2628363983156643, "3": 0.03859675011375623, "2": 0.009087640276845872, "1": 0.00017101624602162166}, "score": 4.205553965624188}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9270310211059265, "4": 0.0727265544844616, "3": 0.00023764300247601804, "2": 1.974913417130026e-06, "1": 0}, "score": 4.926792029312625}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9845338791013798, "4": 0.01531376778472415, "3": 0.00014225960005917812, "2": 4.871376558148674e-06, "1": 0}, "score": 4.984387017352344}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7368353996998037, "4": 0.2593268613544605, "3": 0.0037567776387309572, "2": 4.11815177730651e-05, "1": 0}, "score": 4.733025418622181}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"2": 0.6344920763041486, "1": 0.3375525760207161, "3": 0.02468069795891044, "4": 0.002753592104082594, "5": 0.0004888363925669454}, "score": 1.694091958593888}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.7555633492677829, "1": 0.12176452771380109, "3": 0.10628900847162594, "4": 0.014105944143117475, "5": 0.002084098273526709}, "score": 2.0189923307543953}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9319183643798977, "4": 0.0673074937560853, "3": 0.0007355890140682466, "2": 2.4911325961961825e-05, "1": 0}, "score": 4.931145654959693}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9959301414139738, "4": 0.0040445377980767175, "3": 2.1579387096441728e-05, "2": 1.1190035009474656e-06, "1": 0}, "score": 4.995908935688831}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.48645355964042664, "3": 0.2901983570466516, "5": 0.12992118261111688, "2": 0.08505241206413272, "1": 0.00834221091518229}, "score": 3.6445798965391867}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8144578922041364, "3": 0.10191433209677785, "1": 0.07355427572807344, "4": 0.008413289836320908, "5": 0.0009408426011598735}, "score": 2.0480437249407384}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8360374502090576, "4": 0.15215617781696472, "3": 0.009734626574100203, "2": 0.001461316408275303, "1": 0}, "score": 4.823883112956247}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7418618493570626, "5": 0.14057933326358993, "3": 0.09098391011695021, "2": 0.02508305400742193, "1": 0.0012675902777322659}, "score": 3.995625563274395}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9847093278398165, "4": 0.014959292505009764, "3": 0.00023323197472526004, "2": 3.362657099811964e-05, "1": 0}, "score": 4.984472361972113}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7546997431690786, "3": 0.12475065423444154, "2": 0.059251498982749895, "5": 0.05907219139960066, "1": 0.0018051588238782448}, "score": 3.8103232555947644}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"1": 0.7001100584082439, "2": 0.29904449618240203, "3": 0.0008226703370903003, "5": 1.4286678904444168e-05, "4": 6.794256058631809e-06}, "score": 1.3007678758824537}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.8187834073457921, "4": 0.10609590815863416, "2": 0.07188317839302916, "5": 0.002926119899356687, "1": 0.0003078071830768267}, "score": 3.039449496388706}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7687479857710973, "4": 0.2277226358513134, "3": 0.0034425193722463472, "2": 7.032765155483727e-05, "1": 1.0051506843717645e-05}, "score": 4.765139614562804}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.977404778663063, "4": 0.021969995443106502, "3": 0.000616625307332372, "2": 6.791532108140871e-06, "1": 9.523902116009205e-07}, "score": 4.976772549886933}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8333768651319331, "4": 0.09626781808368548, "2": 0.05415152735126748, "5": 0.01596965372233503, "1": 0.00023197429264551765}, "score": 3.073591808654467}]