[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6973706503576829, "5": 0.3020676439799393, "3": 0.0005608974879869207, "2": 7.086691942815232e-07, "1": 1.8430296085206348e-08}, "score": 4.301505298307187}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9640090870650431, "4": 0.03597458363526765, "3": 1.6269668693024492e-05, "2": 3.3005256509443134e-08, "1": 0}, "score": 4.963992777052858}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6122549183157565, "5": 0.3874531270332991, "3": 0.00029160628633092097, "2": 3.713191134428774e-07, "1": 0}, "score": 4.3871607692216585}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994284230123979, "4": 0.0005713166206349672, "3": 1.7826190351390982e-07, "1": 0, "2": 0}, "score": 4.999428326808621}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9996626874526736, "5": 0.0003273412019575454, "3": 9.04726550548717e-06, "2": 1.5679352884545657e-07, "1": 0}, "score": 4.000317980593377}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7131397749376647, "4": 0.28658451358275855, "3": 0.0002747760927849064, "2": 7.727246974373989e-07, "1": 0}, "score": 4.7128635693513665}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.681585368568172, "5": 0.3176589995552706, "3": 0.0007543918726247875, "2": 1.1134402626047126e-06, "1": 2.427892856557509e-08}, "score": 4.316902340379608}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8307965081384716, "5": 0.16811599355399787, "3": 0.0010863280839604587, "2": 1.0153136280970775e-06, "1": 0}, "score": 4.167027660717027}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9942276464234845, "4": 0.005770947502913618, "3": 1.389548060529021e-06, "2": 1.1306398867942326e-08, "1": 0}, "score": 4.994226239451635}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9919257145772383, "4": 0.008073170492009894, "3": 1.042450881969725e-06, "1": 0, "2": 0}, "score": 4.991924744020933}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8412994400522494, "5": 0.15469842537907588, "3": 0.00399749645524309, "2": 4.3435394532600746e-06, "1": 0}, "score": 4.150692286234953}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7753395860897554, "4": 0.22448582816638726, "3": 0.0001741128335911857, "2": 3.5207838552099533e-07, "1": 0}, "score": 4.775164862764021}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5967332636428851, "4": 0.4029705486414974, "3": 0.00029566958323249423, "2": 4.2602747391431585e-07, "1": 0}, "score": 4.5964367969394635}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9877435082227597, "4": 0.01225351186769499, "3": 2.9438538549230253e-06, "1": 0, "2": 0}, "score": 4.987740599982574}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9535011574940785, "4": 0.04648374487891436, "3": 1.4987050945416902e-05, "2": 3.603176234917618e-08, "1": 0}, "score": 4.953486169456567}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9781890499700524, "4": 0.02179156305331627, "3": 1.9161279651407627e-05, "2": 7.676600024184232e-08, "1": 0}, "score": 4.978169880838199}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9426776559935011, "5": 0.05442763814500094, "3": 0.0028925089635718484, "2": 2.1574836332429747e-06, "1": 2.6989336321806232e-08}, "score": 4.0515307338864215}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7159037631955112, "4": 0.28144061860379854, "2": 0.0025283018680409158, "5": 0.00012574757920809287, "1": 1.2575036907333555e-06}, "score": 3.2791613837757034}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5394744791698352, "4": 0.4599844336329266, "3": 0.000540012106074914, "2": 8.096854484083007e-07, "1": 0}, "score": 4.538932990728759}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9398811339111396, "4": 0.059989309958023616, "3": 0.00012880975623455476, "2": 4.6696244503271815e-07, "1": 0}, "score": 4.939751652808052}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6297485413428849, "5": 0.3698219150081014, "3": 0.0004291450861748215, "2": 5.104669203357367e-07, "1": 0}, "score": 4.369391707651646}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9483227946487328, "4": 0.05166857065618316, "3": 8.543455557324834e-06, "1": 0, "2": 0}, "score": 4.948314337716927}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5008905073429895, "4": 0.49869035844187415, "3": 0.0004188381456088584, "2": 2.4973162392565223e-07, "1": 0}, "score": 4.500471192924918}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9572310836104334, "4": 0.04276315549763461, "3": 5.712047597877282e-06, "2": 1.2894306236884188e-08, "1": 0}, "score": 4.957225380186501}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9872651463234179, "4": 0.012729132688982061, "3": 5.63761756077701e-06, "2": 1.845740854322599e-08, "1": 0}, "score": 4.987259535876654}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9418808825941672, "4": 0.058111075794293594, "3": 7.9935867022994e-06, "2": 1.0024096424854672e-08, "1": 0}, "score": 4.941872904751139}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8750364555558691, "4": 0.12491784471977505, "3": 4.561239765486522e-05, "2": 8.308655011412589e-08, "1": 0}, "score": 4.874990680695206}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9876726806630456, "4": 0.012325413622273292, "3": 1.8326290183792195e-06, "2": 2.8973653873477023e-09, "1": 0}, "score": 4.987670911562237}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969373848033503, "4": 0.0030622562442295595, "3": 3.8023285331972596e-07, "1": 0, "2": 0}, "score": 4.996936983355246}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.988971588771567, "4": 0.011027523444326481, "3": 8.126518889236006e-07, "1": 0, "2": 0}, "score": 4.988970850423251}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"4": 0.82931227167826, "5": 0.16871044106996977, "3": 0.001975622974974334, "2": 1.6467959604879829e-06, "1": 0}, "score": 4.1667315274176815}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9483022124741564, "3": 0.03652146898282952, "5": 0.014614559808951853, "2": 0.0005605491106122721, "1": 1.0887056983352478e-06}, "score": 3.976968723702912}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9881794877210475, "4": 0.011818446564078076, "3": 1.9269502234041528e-06, "2": 6.791445713489128e-09, "1": 0}, "score": 4.988177677600908}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9930275054253395, "4": 0.006971157493942351, "3": 1.3363066242685195e-06, "2": 1.0095016002421032e-08, "1": 0}, "score": 4.993026139672764}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9915117275534537, "4": 0.00848624552221794, "3": 1.9979677879800166e-06, "1": 0, "2": 0}, "score": 4.991509758296357}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6980525308180062, "4": 0.3018616437078982, "3": 8.562622113953137e-05, "2": 1.159630767950852e-07, "1": 0}, "score": 4.6979667308042785}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9805048361769211, "4": 0.01948897612876193, "3": 6.16421352777981e-06, "2": 2.18526203086997e-08, "1": 0}, "score": 4.980498629854571}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6464446883241963, "5": 0.3523485128074669, "3": 0.0012038586973353528, "2": 2.8319472746909075e-06, "1": 8.290876919511974e-08}, "score": 4.351138750378338}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9346252380135558, "4": 0.06532689886696456, "3": 4.749386562501996e-05, "2": 2.6599881049447327e-07, "1": 2.5410204287421522e-08}, "score": 4.93457720867171}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9930580752545949, "4": 0.006940461556323772, "3": 1.4804521649365478e-06, "1": 0, "2": 0}, "score": 4.993056577659211}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9866374117747612, "4": 0.013354231207100933, "3": 8.18323507166328e-06, "2": 4.001425785377519e-08, "1": 0}, "score": 4.986629280491397}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945420241696994, "4": 0.0054571440163761215, "3": 8.330251526311184e-07, "2": 1.749737605442886e-09, "1": 0}, "score": 4.99454118470027}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7268234705389746, "5": 0.271942943835669, "3": 0.001231231488883911, "2": 2.3283586050222673e-06, "1": 3.523069913195769e-08}, "score": 4.27070694737853}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9961440755423071, "4": 0.003855218091101046, "3": 6.999751517731392e-07, "1": 0, "2": 0}, "score": 4.996143381933947}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9774536276423387, "4": 0.022529903674046694, "3": 1.6342802036043343e-05, "2": 9.122927441320236e-08, "1": 0}, "score": 4.9774371362522025}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7983448037135781, "5": 0.200754281271321, "3": 0.0008996398872403017, "2": 1.1942323069307836e-06, "1": 0}, "score": 4.199852269086628}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9938011451702303, "4": 0.00619589687728305, "3": 2.889445334611502e-06, "1": 0, "2": 0}, "score": 4.993798323807189}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8212764768560927, "4": 0.1784171734029157, "3": 0.00030505605846493564, "2": 1.1728064572364645e-06, "1": 0}, "score": 4.82096917442024}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9877943358481696, "4": 0.012203574235833665, "3": 1.989233836790296e-06, "1": 0, "2": 0}, "score": 4.98779244606741}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7947618412204381, "4": 0.20500364900044013, "3": 0.00023406890971441814, "2": 4.5880617167743027e-07, "1": 0}, "score": 4.79452684044714}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9642721576529247, "4": 0.035665294710105044, "3": 6.183549534796276e-05, "2": 3.9351407538823363e-07, "1": 0}, "score": 4.964209842353243}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9903702577955036, "4": 0.009627593312831792, "3": 2.0667380807019317e-06, "1": 0, "2": 0}, "score": 4.990368272419726}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7969813585409727, "4": 0.20288448526650635, "3": 0.00013410050524638936, "2": 1.2817093938760607e-07, "1": 0}, "score": 4.796846943935462}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9901565708346846, "4": 0.00984192457649945, "3": 1.4522100347370534e-06, "2": 7.286467327077881e-09, "1": 0}, "score": 4.990155148700103}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6996865429604396, "4": 0.29965187344101196, "3": 0.0006586363478342695, "2": 2.5381654542425466e-06, "1": 1.1515463035286352e-07}, "score": 4.699022690281985}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9177802923118367, "5": 0.07987950238385964, "3": 0.002339142195360124, "2": 9.254312424695655e-07, "1": 0}, "score": 4.077538520001339}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8843457667162972, "4": 0.11563068694151617, "3": 2.3454246313451758e-05, "2": 2.0766618899673395e-08, "1": 0}, "score": 4.884322334014799}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8280789656514184, "4": 0.17188533181324608, "3": 3.563230100078347e-05, "2": 4.8997184483845566e-08, "1": 0}, "score": 4.8280432529413275}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962494837211796, "4": 0.0037502465293525237, "3": 2.682849969533223e-07, "1": 0, "2": 0}, "score": 4.996249216895161}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.989729459927324, "3": 0.005495131832821808, "5": 0.004724575326807654, "2": 4.997018651877792e-05, "1": 5.053942596955161e-07}, "score": 3.999127986626571}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9920292978603211, "4": 0.007968906480879393, "3": 1.6990589822751259e-06, "1": 0, "2": 0}, "score": 4.992027694631033}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9987453188713707, "4": 0.001254244976237, "3": 4.082969943599686e-07, "1": 0, "2": 0}, "score": 4.998744938394815}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9173654759694393, "4": 0.0825882384698498, "3": 4.607550933468161e-05, "2": 9.971736526199112e-08, "1": 0}, "score": 4.9173193022368915}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999340081435584, "4": 6.594714302880685e-05, "3": 2.6853007797830406e-08, "1": 0, "2": 0}, "score": 4.9999339991497775}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993382964624098, "4": 0.0006613987813164501, "3": 1.962811042203517e-07, "1": 0, "2": 0}, "score": 4.999338208584687}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9778595017593449, "4": 0.022130567086727174, "3": 9.836486241009405e-06, "2": 6.45978957640691e-08, "1": 0}, "score": 4.977849565481044}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9843359870073687, "4": 0.015661760101554716, "3": 2.266141392293335e-06, "2": 6.8315517020124045e-09, "1": 0}, "score": 4.984333687435615}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8148438248946477, "5": 0.18311820604401008, "3": 0.002035183484049568, "2": 2.6668848221297727e-06, "1": 3.780161539184489e-08}, "score": 4.1810775900329915}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998566603941031, "4": 0.0001433100633278852, "3": 1.2267123981917287e-08, "1": 0, "2": 0}, "score": 4.999856665399949}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9236446031080263, "4": 0.07633698704676867, "3": 1.8316688019933217e-05, "2": 2.7390050772107376e-08, "1": 0}, "score": 4.923626292384159}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.547002393983644, "3": 0.45167332172432334, "2": 0.0009746876473358707, "5": 0.00034904754951978363, "1": 4.316252940386983e-07}, "score": 3.5467250024084818}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5199596638159767, "4": 0.4797846795476285, "3": 0.00025524415507662424, "2": 3.663366930689992e-07, "1": 0}, "score": 4.519703710969047}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8397967170031877, "5": 0.15887883679377454, "3": 0.0013225301457151547, "2": 1.772497480464168e-06, "1": 0}, "score": 4.157552784271351}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8943347349556525, "4": 0.1056352982323156, "3": 2.982349655905685e-05, "2": 7.143913560824578e-08, "1": 0}, "score": 4.894304832860177}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8033541971072491, "3": 0.19036513269433114, "5": 0.005642041561395041, "2": 0.0006374734046487245, "1": 8.204941961450734e-07}, "score": 3.8139994383136884}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7693953133403112, "5": 0.2296647137358397, "3": 0.0009382435448144904, "2": 1.4865894818296562e-06, "1": 5.6820310267614575e-08}, "score": 4.228723369086643}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7245381076890748, "4": 0.27533850803221877, "3": 0.0001233120405608548, "2": 8.807747606253972e-08, "1": 0}, "score": 4.724414608019321}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.820783965472092, "5": 0.17831937408087317, "3": 0.0008961408129741884, "2": 4.878382211954057e-07, "1": 1.0211278420730555e-08}, "score": 4.177422230787203}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.772302072397944, "4": 0.22754262397695837, "3": 0.00015512675516235732, "2": 1.9482365906637504e-07, "1": 1.6264841856516973e-08}, "score": 4.772146480779193}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5873284356716081, "4": 0.4124702075239735, "3": 0.00020099932663207273, "2": 2.2267957103658747e-07, "1": 0}, "score": 4.587127070129514}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.535280484165034, "4": 0.24488048592688083, "2": 0.21507331693173695, "5": 0.0039259445775512046, "1": 0.0008395328095156038}, "score": 3.0359800010077174}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.995420893224987, "4": 0.0045787190654799845, "3": 3.805181349269459e-07, "1": 0, "2": 0}, "score": 4.995420519865317}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9821663458638588, "4": 0.017831627010148243, "3": 2.0660313771315307e-06, "1": 0, "2": 0}, "score": 4.982164241621004}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998064914551942, "4": 0.00019343364968139445, "3": 3.112205827130302e-08, "1": 0, "2": 0}, "score": 4.999806504097732}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999523684704165, "4": 0.00047611444593290207, "3": 7.764458700154024e-08, "1": 0, "2": 0}, "score": 4.9995237302062145}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"5": 0.909983419469883, "4": 0.0899801669642635, "3": 3.6199400501562365e-05, "2": 1.677337392867832e-07, "1": 0}, "score": 4.909946926852206}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7778766227210945, "4": 0.22211002761531992, "3": 1.3334578625062203e-05, "2": 8.744245588063864e-09, "1": 0}, "score": 4.7778632755861885}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982083786730485, "4": 0.0017913500957363055, "3": 2.5510056423045827e-07, "1": 0, "2": 0}, "score": 4.998208139674231}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999819001822147, "4": 0.00018092336755946053, "3": 4.125741428807943e-08, "1": 0, "2": 0}, "score": 4.999818994111538}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984820076177358, "4": 0.001517748943576142, "3": 2.0731322979086128e-07, "1": 0, "2": 0}, "score": 4.99848183637512}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"3": 0.565575376800509, "4": 0.4244439583360283, "2": 0.007815619872156754, "5": 0.002158693071282334, "1": 6.238230434595372e-06}, "score": 3.4209332960013006}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5270073413934225, "4": 0.47272540413979686, "3": 0.00026688492099068243, "2": 2.839811426810796e-07, "1": 0}, "score": 4.526739933580463}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9331104775981353, "5": 0.04664274889988203, "3": 0.02021505207167135, "2": 3.114203635970892e-05, "1": 2.2123928137380927e-07}, "score": 4.026364758480308}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9123207419516851, "4": 0.0876675552142572, "3": 1.160715313886761e-05, "2": 1.4355251550228939e-08, "1": 0}, "score": 4.912309180282197}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9059707755742265, "3": 0.08257958367597729, "5": 0.011105297858259464, "2": 0.00034316025642966923, "1": 8.581327750117175e-07}, "score": 3.92783679585397}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7938462152962946, "5": 0.19006866069915623, "3": 0.01594711569935408, "2": 0.0001369206495914105, "1": 9.397866082063932e-07}, "score": 4.173844910047068}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6369719875281042, "4": 0.35785317586038884, "3": 0.00507312997394193, "2": 9.871012827713156e-05, "1": 2.740500472627327e-06}, "score": 4.631693377515264}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.664086312001061, "5": 0.33187267256411795, "3": 0.004015547810175853, "2": 2.4625181509232177e-05, "1": 6.012987125584828e-07}, "score": 4.327806149543411}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9723260970441359, "4": 0.027574614334405882, "3": 9.72292466787539e-05, "2": 1.6987837570138462e-06, "1": 1.4469337337054834e-07}, "score": 4.972225246050968}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9234764042695595, "5": 0.06345510062194298, "3": 0.013003184369712224, "2": 6.40574641571483e-05, "1": 9.763565496315271e-07}, "score": 4.050320886189031}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9293989928388179, "5": 0.04814919786321635, "3": 0.02241145201714248, "2": 4.0075154668504944e-05, "1": 2.777506689413138e-07}, "score": 4.025656762396991}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7875027785272515, "4": 0.21230144582586558, "3": 0.00019516757684700424, "2": 6.171109546215568e-07, "1": 0}, "score": 4.787306369610522}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5528580893569132, "4": 0.4470303676942434, "3": 0.00011143077632496313, "2": 5.675131551344012e-08, "1": 0}, "score": 4.552746575711837}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9859905589763882, "4": 0.014008709999444854, "3": 6.658659253237312e-07, "1": 0, "2": 0}, "score": 4.985989957355835}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6545539484905482, "4": 0.34531273302937265, "3": 0.00013313192554240228, "2": 1.1703076359512303e-07, "1": 0}, "score": 4.654420628001269}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6150927681689959, "5": 0.38396125113063045, "3": 0.0009444970446855726, "2": 1.5415826106130623e-06, "1": 0}, "score": 4.383013648733922}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8700469180452228, "4": 0.1299209617452942, "3": 3.200149300009331e-05, "2": 6.546664897064645e-08, "1": 0}, "score": 4.87001483194707}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7517445777321277, "5": 0.24769109348411517, "3": 0.0005639392641174349, "2": 3.847573350314192e-07, "1": 1.0788015444855429e-08}, "score": 4.247126350852169}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997464409015432, "4": 0.00025349942580617506, "3": 4.035074415086061e-08, "1": 0, "2": 0}, "score": 4.999746419867805}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.958628296618414, "5": 0.03921472362610494, "3": 0.0021509449968295197, "2": 5.859571968272676e-06, "1": 1.1469825804265926e-07}, "score": 4.0370517176317655}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8829176449986823, "4": 0.11699228342405192, "3": 8.975749718409858e-05, "2": 2.5434696452322003e-07, "1": 0}, "score": 4.882827431541605}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9254063320797123, "5": 0.07344114072813687, "3": 0.0011519178845748833, "2": 5.266587665118336e-07, "1": 0}, "score": 4.072288175500559}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6956878086965732, "5": 0.303592116661009, "3": 0.0007192295416078, "2": 8.728815254460438e-07, "1": 3.465891005229736e-08}, "score": 4.302871018468469}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993494905730591, "4": 0.0006502941883528553, "3": 1.3397669098490894e-07, "1": 0, "2": 0}, "score": 4.999349437805399}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998846623019038, "4": 0.00011525321276386565, "3": 2.593501112982732e-08, "1": 0, "2": 0}, "score": 4.999884694910462}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5551941314501698, "4": 0.4442260386663416, "3": 0.0005783091330484165, "2": 1.4455726750476804e-06, "1": 0}, "score": 4.554612972866335}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9671725451424722, "5": 0.026853610440752955, "3": 0.005967692155109476, "2": 6.092561238748917e-06, "1": 1.312666735455049e-08}, "score": 4.02087369475533}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5839967273630532, "4": 0.4158395875239164, "3": 0.00016353148783868076, "2": 1.444728119055024e-07, "1": 0}, "score": 4.583832912273052}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9940214838777778, "4": 0.005978084978593687, "3": 4.531706824399073e-07, "1": 0, "2": 0}, "score": 4.994021008811741}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9870581375407017, "5": 0.007483741586209544, "3": 0.005455853554419386, "2": 2.2280785069666214e-06, "1": 0}, "score": 4.002023431954177}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9312189333554981, "4": 0.06875757270946832, "3": 2.3340535218147413e-05, "2": 6.902390107070952e-08, "1": 0}, "score": 4.931195533342953}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5417504272056194, "4": 0.45788903769343314, "3": 0.0003600202061121268, "2": 4.5808457880577754e-07, "1": 0}, "score": 4.541389521586828}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9629651912453197, "5": 0.020622831328477136, "3": 0.016389260601929318, "2": 2.254293150302449e-05, "1": 1.1845555618647378e-07}, "score": 4.004188129729052}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999741197265207, "4": 0.00025876221675168474, "3": 2.9680665392908407e-08, "1": 0, "2": 0}, "score": 4.999741178419113}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9862342140333367, "4": 0.013752431969502888, "3": 1.3167537996046234e-05, "2": 8.105418137723626e-08, "1": 0}, "score": 4.986220988339585}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9981074289753733, "4": 0.0018918690939316912, "3": 6.894166718677839e-07, "2": 3.514020547055877e-09, "1": 0}, "score": 4.998106741513625}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8671824032134812, "4": 0.13277332872826553, "3": 4.422558898886442e-05, "2": 3.1326545493470076e-08, "1": 0}, "score": 4.867138124633677}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8590802661310352, "4": 0.14081459260049475, "3": 0.00010496506263347273, "2": 1.3995008690687043e-07, "1": 0}, "score": 4.8589750523110125}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9946225724062469, "4": 0.005377167125965484, "3": 2.721582876560043e-07, "1": 0, "2": 0}, "score": 4.994622288620327}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986617260882734, "4": 0.0013379750027489317, "3": 2.1085661167520761e-07, "1": 0, "2": 0}, "score": 4.998661603166179}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9402677724271611, "5": 0.0359135829461559, "3": 0.02375586337556328, "2": 6.249237554146672e-05, "1": 2.3820385411318492e-07}, "score": 4.012032020817632}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.751795434973038, "5": 0.24615033790951876, "3": 0.002039779836978252, "2": 1.4064706269922953e-05, "1": 2.6058545169593e-07}, "score": 4.244081676678864}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9467622720426067, "4": 0.05321844139170591, "3": 1.9157754300294036e-05, "2": 3.9543875869275526e-08, "1": 0}, "score": 4.946743119713956}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999901944987707, "4": 9.792927730194438e-05, "3": 2.3861012169268726e-08, "1": 0, "2": 0}, "score": 4.9999020229906925}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.983764938603626, "4": 0.01622958123010768, "3": 5.389435012317246e-06, "2": 1.8234854351906635e-08, "1": 0}, "score": 4.9837595840179345}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.853471584682134, "5": 0.143639268820289, "3": 0.0028825481549314387, "2": 6.291550595907822e-06, "1": 1.2008728302736835e-07}, "score": 4.140743803579856}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8923699189735602, "5": 0.10523731881468384, "3": 0.002388653406659402, "2": 3.974915770077893e-06, "1": 3.025165328238183e-08}, "score": 4.102840635479688}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6239393942056801, "5": 0.37484217809905473, "3": 0.0012166360071209246, "2": 1.5789286666400599e-06, "1": 2.7455865840451258e-08}, "score": 4.373622371100579}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.997335153224857, "4": 0.0026646288482832904, "3": 2.4064476380109553e-07, "1": 0, "2": 0}, "score": 4.997334889922734}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9980557626827278, "4": 0.0019439097478980078, "3": 2.712722249903424e-07, "1": 0, "2": 0}, "score": 4.9980555475981845}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9895443998012524, "4": 0.010450666737239149, "3": 4.84992168775443e-06, "2": 2.231486028321381e-08, "1": 0}, "score": 4.989539565834364}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9211944277108544, "5": 0.04359836191891634, "3": 0.034891497642946745, "2": 0.0003147742004965985, "1": 8.505182222516816e-07}, "score": 4.0080747650309565}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9965675084145783, "4": 0.0034307976287965627, "3": 1.6342819898638427e-06, "2": 1.5087066248497258e-08, "1": 0}, "score": 4.996565888392906}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997453683241494, "4": 0.0002545829097443357, "3": 3.403518481213426e-08, "1": 0, "2": 0}, "score": 4.999745349016135}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999721898777316, "4": 0.0002780206962784211, "3": 5.3554661197672066e-08, "2": 1.0915032089476445e-09, "1": 0}, "score": 4.999721868912691}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"4": 0.906555487463768, "5": 0.08650045542753115, "3": 0.006934665915915675, "2": 8.936522737308667e-06, "1": 0}, "score": 4.079547952634213}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9471560991047817, "4": 0.05283351689424104, "3": 1.0262541903779082e-05, "1": 0, "2": 0}, "score": 4.947145951602349}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8421606055461589, "4": 0.15780267797872666, "3": 3.6681207179792436e-05, "2": 3.114207618984259e-08, "1": 0}, "score": 4.842123865529311}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995586998615626, "4": 0.00044120929644000993, "3": 3.210949680315539e-08, "1": 0, "2": 0}, "score": 4.99955872645865}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9542268781888538, "4": 0.04576184562544736, "3": 1.1213759577364266e-05, "2": 1.7284944058446793e-08, "1": 0}, "score": 4.954215672933807}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9805118291623497, "3": 0.014177458574484297, "5": 0.005304615438129598, "2": 6.062083530865847e-06, "1": 0}, "score": 3.9911150323879068}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8373661407480739, "4": 0.16254431608872522, "3": 8.936459350830891e-05, "2": 8.983286038592641e-08, "1": 0}, "score": 4.837276670786124}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9153458930032072, "5": 0.08203663198075979, "3": 0.0026139975527223447, "2": 3.2089204044266583e-06, "1": 3.077121998121989e-08}, "score": 4.07941614315648}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988569813440326, "4": 0.0011429221576864843, "3": 1.0621845153104515e-07, "1": 0, "2": 0}, "score": 4.9988568654165215}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951704270734322, "4": 0.00482879173981709, "3": 7.773796467903309e-07, "1": 0, "2": 0}, "score": 4.995169653482501}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7361802318504066, "5": 0.2578809331507107, "3": 0.00592362314237117, "2": 1.4864525836571358e-05, "1": 1.6798250497825265e-07}, "score": 4.2519271221918205}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9949029691708808, "4": 0.005095621690632633, "3": 1.3528771650496697e-06, "2": 1.3843085096516153e-08, "1": 0}, "score": 4.994901630809518}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.61217858100934, "5": 0.3868384789997048, "3": 0.0009810038243367864, "2": 1.7992385686066912e-06, "1": 0}, "score": 4.385853929532456}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9966424559993594, "4": 0.0033569112453973875, "3": 6.369701772335315e-07, "1": 0, "2": 0}, "score": 4.996641814828402}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9811449882071627, "4": 0.018853268215200034, "3": 1.7734593212230358e-06, "1": 0, "2": 0}, "score": 4.981143185429631}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6952611490266626, "5": 0.2999763922267078, "3": 0.004731788639842359, "2": 3.0011467480223583e-05, "1": 4.993577820595053e-07}, "score": 4.295183129595778}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8636659645820728, "5": 0.13388172741645493, "3": 0.002445917428633907, "2": 6.283703638284155e-06, "1": 1.4032383195614045e-07}, "score": 4.131422817212346}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7543796523432968, "5": 0.243619280033393, "3": 0.0019948793632849895, "2": 5.756004426015463e-06, "1": 1.6295316642022407e-07}, "score": 4.241612464868582}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988996835925147, "4": 0.0010993727380079787, "3": 8.84631201729941e-07, "2": 1.2270473363934193e-08, "1": 0}, "score": 4.998898821136669}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9527652910248408, "4": 0.04719939048157315, "3": 3.510131372956977e-05, "2": 2.0642349034578492e-07, "1": 2.835906797192673e-08}, "score": 4.95272967501631}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8904468264953911, "4": 0.10950024415522336, "3": 5.2686463236229015e-05, "2": 1.2781396866471908e-07, "1": 0}, "score": 4.890393986863796}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6140386775908407, "4": 0.38566682110944817, "3": 0.00029426789442326995, "2": 3.366974783888606e-07, "1": 0}, "score": 4.613743672906533}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7154613139506064, "4": 0.28434994461696494, "3": 0.00018860682513595575, "2": 1.9006912788170806e-07, "1": 0}, "score": 4.7152722873169}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999930118027176, "4": 6.8969380894616545e-06, "3": 4.8833616086547445e-09, "1": 0, "2": 0}, "score": 4.9999930932945915}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8828577993373458, "4": 0.11703971000687144, "3": 0.00010203619037615256, "2": 4.318489338587237e-07, "1": 0}, "score": 4.882754919413904}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7662195741435104, "3": 0.2160504356877756, "4": 0.011345946901726535, "1": 0.006161512474499862, "5": 0.00022253993262262478}, "score": 2.233248434682674}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8379772054530696, "4": 0.16187121970091592, "3": 0.00015126640562398457, "2": 3.005369887091237e-07, "1": 0}, "score": 4.837825344595139}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.784392504827071, "4": 0.21547170012232117, "3": 0.0001352375089189921, "2": 4.327346994811803e-07, "1": 0}, "score": 4.784256499729445}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992293838772358, "4": 0.0007701621352673727, "3": 3.444044994062835e-07, "1": 0, "2": 0}, "score": 4.999229148971262}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9981304671576839, "4": 0.0018680329502704155, "3": 1.4224269862944568e-06, "2": 1.6623690839523296e-08, "1": 0}, "score": 4.998129072210854}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7198648449068004, "4": 0.2796138317689624, "3": 0.0005192791282537515, "2": 1.7236403864976194e-06, "1": 6.462561420653271e-08}, "score": 4.719342108722145}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.875563351069757, "4": 0.12426705000989416, "3": 0.00016839014150525823, "2": 1.1413497553582392e-06, "1": 8.192161184553222e-08}, "score": 4.87539241977726}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6464434342227174, "4": 0.35303940478242096, "3": 0.0005151047396592034, "2": 1.8428191723783644e-06, "1": 6.400760068084634e-08}, "score": 4.645924548341402}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9765427468963752, "4": 0.02344917420144766, "3": 8.00425726264161e-06, "2": 2.4708216421105852e-08, "1": 0}, "score": 4.976534741987599}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998675064280487, "4": 0.00013230085821216064, "3": 1.335917939847669e-07, "1": 0, "2": 0}, "score": 4.999867431950363}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9820264118615533, "4": 0.017965734036450895, "3": 7.864551876502804e-06, "2": 2.9500518425774133e-08, "1": 0}, "score": 4.9820184490766115}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9988041754686748, "4": 0.0011955451561620697, "3": 2.965440686624375e-07, "1": 0, "2": 0}, "score": 4.998803861776237}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7922623357542355, "4": 0.2075366974017882, "3": 0.00020006644931958313, "2": 6.913919172071206e-07, "1": 0}, "score": 4.792061052064011}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998815633641722, "4": 0.00011825810402021492, "3": 4.805161938580953e-08, "1": 0, "2": 0}, "score": 4.9998816457772985}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9968203448447296, "4": 0.0031789176555994726, "3": 6.782282186273003e-07, "1": 0, "2": 0}, "score": 4.9968197256994635}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8557029363893283, "4": 0.14424598609677064, "3": 5.07293459111621e-05, "2": 2.1831267778926646e-07, "1": 0}, "score": 4.855651881529003}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995296383847244, "4": 0.0004702077216211766, "3": 1.000275688953538e-07, "1": 0, "2": 0}, "score": 4.999529592197902}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9514996786270594, "5": 0.045047337395184454, "3": 0.0034486773439928882, "2": 4.28154342524904e-06, "1": 2.5862003286355725e-08}, "score": 4.041590019346239}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999838547864799, "4": 0.0001614316055576446, "3": 1.089766816951243e-08, "1": 0, "2": 0}, "score": 4.999838546597551}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999496229129681, "4": 5.033031391804733e-05, "3": 4.573957651111834e-09, "1": 0, "2": 0}, "score": 4.999949660536042}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8686946902753443, "5": 0.12946419792051375, "3": 0.0018401216415653442, "2": 9.660676250078803e-07, "1": 0}, "score": 4.127622147218748}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994832060386742, "4": 0.005166462813267745, "3": 1.4793954993652845e-06, "2": 1.2847648994120098e-08, "1": 0}, "score": 4.99483053993262}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987086910578313, "4": 0.0012911147325467619, "3": 1.6463729414089652e-07, "1": 0, "2": 0}, "score": 4.998708555954674}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999028985246534, "4": 9.698119153143957e-05, "3": 2.8529420040094968e-08, "1": 0, "2": 0}, "score": 4.999902961740725}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999798863910576, "4": 0.00020109723714341687, "3": 1.9332832897793515e-08, "1": 0, "2": 0}, "score": 4.999798864093265}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7602479871835146, "5": 0.23823547587642002, "3": 0.0015155892071777603, "2": 7.622189397670806e-07, "1": 0}, "score": 4.236718406145929}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9993672258860347, "4": 0.0006322571902497627, "3": 4.3646004534625705e-07, "1": 0, "2": 0}, "score": 4.999366869838716}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5295574082934613, "5": 0.470227950871106, "3": 0.00021436744128020812, "2": 1.6495898000231708e-07, "1": 0}, "score": 4.47001330447784}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9872069438223975, "4": 0.012788290901977395, "3": 4.623636690844978e-06, "2": 4.946784373412936e-08, "1": 0}, "score": 4.987202312241534}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999017066011127, "4": 9.819600752486079e-05, "3": 2.3274883946095218e-08, "1": 0, "2": 0}, "score": 4.999901757435427}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7229397309354434, "3": 0.27097782175332746, "5": 0.00572127440688409, "2": 0.00036059042518565734, "1": 6.165477894440103e-07}, "score": 3.734020431221376}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9992135531115887, "4": 0.0007860081473527886, "3": 3.433903466407608e-07, "1": 0, "2": 0}, "score": 4.9992133049969425}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8334562813971393, "4": 0.16641265530022825, "3": 0.0001309096719101385, "2": 8.54999539158284e-08, "1": 0}, "score": 4.833325257500411}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8332730661743455, "5": 0.15623921761667753, "3": 0.010474725696588558, "2": 1.2767687408161671e-05, "1": 5.485585007680111e-08}, "score": 4.145738816457344}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9773187942825916, "4": 0.022676691232160526, "3": 4.418987325511631e-06, "1": 0, "2": 0}, "score": 4.977314468626767}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"4": 0.94638736878441, "5": 0.05163633952525238, "3": 0.00197369077337712, "2": 2.4061899381275565e-06, "1": 0}, "score": 4.049657846041723}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9645771829918376, "3": 0.03254783908789395, "5": 0.0028557122282446817, "2": 1.9210875634497034e-05, "1": 3.5432441851328636e-08}, "score": 3.970269344515459}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9972423221984361, "4": 0.0027570596812608516, "3": 5.660904306720196e-07, "1": 0, "2": 0}, "score": 4.99724180799437}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941482443108256, "4": 0.00585111522005646, "3": 6.830320863012086e-07, "1": 0, "2": 0}, "score": 4.99414751896487}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9449485948047284, "4": 0.05503912406502209, "3": 1.2112616047358663e-05, "2": 2.7158765178461964e-08, "1": 0}, "score": 4.944936561443072}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9941754409004387, "4": 0.0058233627034139975, "3": 1.2261553691160257e-06, "2": 3.798764327763068e-09, "1": 0}, "score": 4.994174173785059}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986219058450522, "4": 0.0013774772947681255, "3": 5.715007736466721e-07, "1": 0, "2": 0}, "score": 4.998621379641151}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8814513312112068, "4": 0.11848804613419635, "3": 6.042449432793376e-05, "2": 1.5379842815278683e-07, "1": 1.7506808054227467e-08}, "score": 4.881390570269371}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999713171213617, "4": 2.8638674453245317e-05, "3": 1.2247132610098148e-08, "1": 0, "2": 0}, "score": 4.999971336830366}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8766353197998759, "4": 0.12317201557391184, "3": 0.00019185417110824366, "2": 7.055332055999892e-07, "1": 6.25349647893993e-08}, "score": 4.876441904107146}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9887199196177169, "4": 0.011278031055111375, "3": 2.0171175924949933e-06, "1": 0, "2": 0}, "score": 4.9887179343463135}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999492653220473, "4": 5.067195278223038e-05, "3": 1.0127300903932642e-08, "1": 0, "2": 0}, "score": 4.999949307789949}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9858525491845126, "4": 0.014143374468373165, "3": 3.960021909544233e-06, "2": 5.5182778998305846e-09, "1": 0}, "score": 4.985848687364911}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982764488232155, "4": 0.001723259023302711, "3": 2.4225159550627784e-07, "1": 0, "2": 0}, "score": 4.998276256387488}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9592536699585014, "4": 0.04074202353204702, "3": 4.217500095004621e-06, "1": 0, "2": 0}, "score": 4.9592495378405905}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.50956576353355, "5": 0.4900876138918753, "3": 0.00034626388506361574, "2": 3.65375589538519e-07, "1": 1.4902304075653553e-08}, "score": 4.489740563976014}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5646532799554805, "4": 0.4351650041204069, "3": 0.00018158548925012149, "2": 1.0905843472196575e-07, "1": 0}, "score": 4.564471488415745}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.637286200477025, "5": 0.3623149564443915, "3": 0.00039856418747287063, "2": 1.3841138992543079e-07, "1": 0}, "score": 4.361916166276021}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977482016104197, "4": 0.002251756951839457, "3": 7.928736917465441e-08, "1": 0, "2": 0}, "score": 4.997748084558657}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973549561093238, "4": 0.002644787651186575, "3": 2.5437837831310046e-07, "1": 0, "2": 0}, "score": 4.997354703587134}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.929497027297037, "4": 0.07047806868798658, "3": 2.473433991290247e-05, "2": 6.889460251148178e-08, "1": 0}, "score": 4.929472248840561}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6223527032049716, "4": 0.37742417175244153, "3": 0.0002229555798151237, "2": 1.1555433323236482e-07, "1": 0}, "score": 4.622129550054523}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9656936119245757, "5": 0.027351177445966324, "3": 0.006949483074092647, "2": 5.690690294779058e-06, "1": 5.049164297514749e-08}, "score": 4.020390161238507}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.949901166559608, "4": 0.05007343755569628, "3": 2.52868009486205e-05, "2": 6.438603984035432e-08, "1": 0}, "score": 4.949875793443851}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6084285337755061, "3": 0.36501588711661465, "2": 0.023878531197303883, "5": 0.002599643392739985, "1": 7.730499392457828e-05}, "score": 3.589594738054608}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"5": 0.97846665734496, "4": 0.021523545576225298, "3": 9.689846240896815e-06, "2": 1.064423833073639e-07, "1": 0}, "score": 4.9784567553871195}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7145646734737336, "5": 0.284411541485669, "3": 0.0010177713430327895, "2": 5.471870739994821e-06, "1": 2.843391844397969e-07}, "score": 4.283382046350978}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9769349993621188, "4": 0.0230532228351713, "3": 1.1650913138931897e-05, "2": 7.103692675264515e-08, "1": 0}, "score": 4.976923260938873}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986069252307592, "4": 0.0013922237361399406, "3": 7.71658301146359e-07, "1": 0, "2": 0}, "score": 4.998606232836628}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9983806438743391, "4": 0.001618817717802358, "3": 5.587045704536006e-07, "1": 0, "2": 0}, "score": 4.998380064905937}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8566620062079177, "5": 0.14157999301105834, "3": 0.0017566810803461533, "2": 1.1736940210000283e-06, "1": 0}, "score": 4.139820984957465}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9563129174305977, "4": 0.043667747187645545, "3": 1.9231173034307968e-05, "2": 2.4248623113491278e-08, "1": 0}, "score": 4.956293714225657}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6682854542513333, "5": 0.33062909196251195, "3": 0.0010836720051777776, "2": 1.6882163509660457e-06, "1": 0}, "score": 4.329542074358113}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9847567181165381, "4": 0.015240995642269895, "3": 2.257681852685942e-06, "1": 0, "2": 0}, "score": 4.9847544885586235}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9677231603334121, "4": 0.03227220324228249, "3": 4.580446845855619e-06, "1": 0, "2": 0}, "score": 4.967718634056996}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9497429594480495, "5": 0.04603134046618986, "3": 0.00422029604732627, "2": 5.261344265932724e-06, "1": 4.740083463817921e-08}, "score": 4.041800383511125}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8409230259595368, "5": 0.15054217522474084, "3": 0.00839043006986263, "2": 0.00014228528023455477, "1": 1.650533481810144e-06}, "score": 4.141862284410706}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9858847604710689, "4": 0.014113619864338218, "3": 1.4932001342476197e-06, "1": 0, "2": 0}, "score": 4.985883391950145}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9883285179067705, "4": 0.011670892003507136, "3": 5.246025020928211e-07, "1": 0, "2": 0}, "score": 4.988328058027126}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995080912268116, "4": 0.0004918484093623805, "3": 5.730877979040647e-08, "1": 0, "2": 0}, "score": 4.999508036971575}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8905099658660458, "5": 0.0749708205861643, "3": 0.03434411842037259, "2": 0.00017369546383461194, "1": 1.2897553612718695e-06}, "score": 4.040275446398642}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6707399721454077, "4": 0.31845761173533665, "3": 0.010733259435659812, "2": 6.545687690532429e-05, "1": 2.686087188607689e-06}, "score": 4.659868409615847}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6621290516330354, "5": 0.3307639169255062, "3": 0.0070891310917746, "2": 1.742511502834034e-05, "1": 2.7037012049804443e-07}, "score": 4.3236391907955065}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960421288001053, "4": 0.00395590610633121, "3": 1.9268384635322647e-06, "2": 1.5438012881761996e-08, "1": 0}, "score": 4.996040193812352}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8169448577287426, "5": 0.1753506141462053, "3": 0.007686536400364904, "2": 1.7717955456551e-05, "1": 2.3624793768176864e-07}, "score": 4.167627939380731}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8988533261913318, "5": 0.06673671685043246, "3": 0.03396888909078886, "2": 0.000439104382414017, "1": 1.7857715414738337e-06}, "score": 4.031884267346455}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6200255451108976, "3": 0.3547241974670808, "2": 0.022803361948737565, "5": 0.0024084822539820723, "1": 3.82004600206065e-05}, "score": 3.6019628748232724}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8265895658151199, "5": 0.14625027683252453, "3": 0.02705430058013543, "2": 0.000104839913979766, "1": 7.437870992396365e-07}, "score": 4.118984097554255}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6392797672483779, "5": 0.35857881375293316, "3": 0.0021312161494811037, "2": 9.66190233537497e-06, "1": 1.9708750874729758e-07}, "score": 4.356427805097293}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.8548900968529708, "4": 0.10188204056180034, "2": 0.04305720063319586, "5": 0.0001365334388609548, "1": 3.402210831862952e-05}, "score": 3.059029868870754}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.999186891152303, "4": 0.0008127131822676062, "3": 3.834582836584186e-07, "1": 0, "2": 0}, "score": 4.999186519891234}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999837140256179, "4": 1.615899011027752e-05, "3": 3.0610522945373e-08, "1": 0, "2": 0}, "score": 4.99998377978728}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9859206788789481, "4": 0.01407360249164507, "3": 5.6207441038661274e-06, "2": 6.132434626646834e-09, "1": 0}, "score": 4.985915136330517}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9744042659583642, "4": 0.025581728827247102, "3": 1.3922372212677773e-05, "2": 3.1377115985488434e-08, "1": 0}, "score": 4.974390330978977}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999909096527971, "4": 9.07535470166695e-05, "3": 1.0502703959385307e-07, "1": 0, "2": 0}, "score": 4.999909036394819}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9542587899777082, "5": 0.026072050513163903, "3": 0.019645450385877068, "2": 2.362126954286413e-05, "1": 8.376186538814614e-08}, "score": 4.0063791063287075}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5590521044854972, "4": 0.43829646361586344, "3": 0.00263403707555213, "2": 1.677976268088332e-05, "1": 2.7740120088541883e-07}, "score": 4.556383863549114}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5967696117729447, "5": 0.40140483393673415, "3": 0.0018151548465515442, "2": 1.0156618459531518e-05, "1": 1.5817544635679183e-07}, "score": 4.399568925150379}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9612353027558543, "4": 0.03875932527022587, "3": 5.231486995162722e-06, "2": 3.0006554374420434e-08, "1": 0}, "score": 4.96123011745281}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7091563321998952, "5": 0.2866108519097844, "3": 0.004212375662751675, "2": 1.9981913870840792e-05, "1": 3.811099198063813e-07}, "score": 4.282357390888588}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8717920485035072, "5": 0.12441690694421566, "3": 0.0037855219575570467, "2": 5.418687123452444e-06, "1": 8.538631456404073e-08}, "score": 4.1206202936875105}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9340072018713429, "4": 0.06590398954027235, "3": 8.828547146165568e-05, "2": 4.404702194933812e-07, "1": 3.506076983676528e-08}, "score": 4.933917974718491}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9269001187362221, "4": 0.0730790461275032, "3": 2.0653474418464217e-05, "2": 4.8502814973332615e-08, "1": 0}, "score": 4.926879491678559}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974618096661704, "4": 0.002537541449422142, "3": 6.546160214520708e-07, "1": 0, "2": 0}, "score": 4.997461149333087}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996285027721901, "4": 0.0003712044756047684, "3": 2.4951794512314666e-07, "1": 0, "2": 0}, "score": 4.999628296472435}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9182663489278174, "3": 0.07801415456296866, "5": 0.0036004947946721697, "2": 0.00011867439399085117, "1": 1.9616082077410755e-07}, "score": 3.9253483931699753}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8328873667026284, "5": 0.16549188807811865, "3": 0.0016181754983566987, "2": 2.477285880767188e-06, "1": 3.918867636971276e-08}, "score": 4.163868649167377}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.940412180437058, "5": 0.0587458304229924, "3": 0.0008415585235915358, "2": 3.5719249457247323e-07, "1": 0}, "score": 4.057903561765915}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9918759846362528, "4": 0.008123148935866261, "3": 8.208002975646011e-07, "1": 0, "2": 0}, "score": 4.991875209092823}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.703131675211699, "4": 0.2967648216949931, "3": 0.00010319914395096542, "2": 1.0992033069178037e-07, "1": 0}, "score": 4.703028392635002}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9966780997602055, "4": 0.0033199916869088254, "3": 1.9256692274839407e-06, "2": 1.5351847681911658e-08, "1": 0}, "score": 4.996676111027015}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9842967177064966, "4": 0.015700140776688774, "3": 3.062055914862051e-06, "2": 4.950832958885793e-09, "1": 0}, "score": 4.984293719088708}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.871607710130715, "4": 0.12834407956475213, "3": 4.811223727540635e-05, "2": 9.196387500488964e-08, "1": 0}, "score": 4.87155941928515}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998644075534868, "4": 0.00013547614294129743, "3": 5.690793786546045e-08, "1": 0, "2": 0}, "score": 4.999864410033129}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9886183081609573, "4": 0.01137997895025084, "3": 1.5928128765601134e-06, "2": 3.611137562405263e-09, "1": 0}, "score": 4.988616823264844}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5536696886080392, "4": 0.44606034206673995, "3": 0.0002692573349889631, "2": 6.597512281673175e-07, "1": 2.888339426142907e-08}, "score": 4.5533990380453835}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9410925475690879, "3": 0.038239785504752904, "5": 0.019330434654664233, "2": 0.0013337261999081624, "1": 3.139182946578915e-06}, "score": 3.9784137712815135}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7436541681279373, "5": 0.2555087815168621, "3": 0.0008360253687042257, "2": 9.123921046137696e-07, "1": 0}, "score": 4.254670960038471}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990568221720842, "4": 0.0009429593343138134, "3": 1.7888423002173808e-07, "2": 2.5534766862450352e-09, "1": 0}, "score": 4.9990566752018415}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9073852927552026, "4": 0.09259698474585093, "3": 1.7595700069547627e-05, "2": 2.720622580353213e-08, "1": 0}, "score": 4.907367733009838}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8684799320637516, "3": 0.1301364582770714, "1": 0.0013250169860046115, "4": 5.8520174495918944e-05, "5": 6.658849646963657e-08}, "score": 2.1289286821675395}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9831503002310217, "4": 0.01684414770033486, "3": 5.5745609337363855e-06, "2": 1.525657926069516e-08, "1": 0}, "score": 4.9831446580443295}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7731101374605922, "5": 0.2252644125177731, "3": 0.0016225078032475965, "2": 2.8494231148918037e-06, "1": 4.376475604415427e-08}, "score": 4.223636085539021}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9832381034059625, "4": 0.016757422240892106, "3": 4.4872388537214605e-06, "2": 1.0990517295328472e-08, "1": 0}, "score": 4.9832335707101665}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9839102002528131, "4": 0.016078713896354617, "3": 1.103249002444789e-05, "2": 3.342422167312174e-08, "1": 0}, "score": 4.983899120529935}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"5": 0.967290654760227, "4": 0.03270476804286544, "3": 4.489433650104911e-06, "2": 6.853461389251889e-09, "1": 0}, "score": 4.9672862298825855}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9325018066870854, "4": 0.06748220132152366, "3": 1.5820705518515213e-05, "2": 1.963468876644094e-08, "1": 0}, "score": 4.932486088124807}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9588258490421612, "4": 0.0411642219160635, "3": 9.853902385207523e-06, "2": 1.9120782584673938e-08, "1": 0}, "score": 4.958816010609748}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999399679479958, "4": 5.998608135918476e-05, "3": 6.5194879458795565e-09, "1": 0, "2": 0}, "score": 4.999940000877298}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997183236782262, "4": 0.0002815242411169357, "3": 4.931369526764248e-08, "1": 0, "2": 0}, "score": 4.9997183771025515}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9552495631214106, "5": 0.03628318021689001, "3": 0.008447134563781876, "2": 1.989922045732207e-05, "1": 1.0063527445853157e-07}, "score": 4.027795948704208}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998957470247192, "4": 0.00010421734330798142, "3": 1.2291547572726469e-08, "1": 0, "2": 0}, "score": 4.999895758071164}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5464254468369784, "5": 0.4527417338649385, "3": 0.0008314883252659301, "2": 1.2586812652067646e-06, "1": 0}, "score": 4.451907760846256}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.960247428219761, "4": 0.03975126557594793, "3": 1.2494338865450767e-06, "1": 0, "2": 0}, "score": 4.960246233299442}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9886776220956074, "4": 0.01131933447382897, "3": 3.0092550546010473e-06, "2": 1.2306540105309693e-08, "1": 0}, "score": 4.988674609848767}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6957612076321165, "4": 0.29993115919741614, "2": 0.004109746217283677, "5": 0.00019627319837648197, "1": 1.6319303174089744e-06}, "score": 3.296210690132471}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8571397798574597, "5": 0.13922964316245237, "3": 0.0036244562569829643, "2": 6.001824809855309e-06, "1": 0}, "score": 4.135593199377651}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.545332324733479, "5": 0.4539679854759486, "3": 0.0006993478500188475, "2": 3.6843298527364755e-07, "1": 0}, "score": 4.453267888751792}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9935922035523722, "4": 0.006407208463627196, "3": 6.06456399410312e-07, "2": 1.7541226843061224e-09, "1": 0}, "score": 4.993591573490827}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.80460194670506, "4": 0.19533375878410172, "3": 6.41459244812701e-05, "2": 8.442333436814929e-08, "1": 0}, "score": 4.80453768355548}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9357731574766931, "5": 0.05394208003503777, "3": 0.010268999289035866, "2": 1.5622209035883828e-05, "1": 1.5701193741470666e-07}, "score": 4.043641364592908}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8295085848316073, "4": 0.17047108262760446, "3": 2.0323087558909713e-05, "2": 3.575431055893065e-08, "1": 0}, "score": 4.829488168418992}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8354381175977721, "4": 0.1645420365638957, "3": 1.9780657335326958e-05, "2": 1.219348553941761e-08, "1": 0}, "score": 4.835418356820206}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9656676032487731, "3": 0.027183965042827288, "5": 0.007105131567580126, "2": 4.317214769171534e-05, "1": 7.532709044313745e-08}, "score": 3.979834595186066}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8385611521220907, "4": 0.16140881641659902, "3": 2.9982400453484116e-05, "2": 4.043888560194995e-08, "1": 0}, "score": 4.838531096073657}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6289181738579998, "5": 0.37063908743864793, "3": 0.00044227398162300166, "2": 3.4673882711533103e-07, "1": 0}, "score": 4.370196163656189}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9891178259545972, "4": 0.01088051178062759, "3": 1.6125722227131821e-06, "2": 1.1979140397065196e-08, "1": 0}, "score": 4.989116226727041}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8156389623724806, "4": 0.18426998261143, "3": 9.057783696059058e-05, "2": 1.0752236118357347e-07, "1": 0}, "score": 4.815548470963808}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9939153664172541, "4": 0.006084560998558616, "3": 9.844970778717631e-08, "1": 0, "2": 0}, "score": 4.993915242259412}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9980639607464319, "4": 0.001935988945718886, "3": 7.134489815964227e-08, "1": 0, "2": 0}, "score": 4.998063868405215}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7662687670192447, "2": 0.21976633735337456, "4": 0.013839478640309951, "1": 0.00011197678331359546, "5": 1.3394545314009577e-05}, "score": 2.793875967399633}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.969041248389444, "5": 0.01989676745288383, "3": 0.011007928423917674, "2": 5.351797388591542e-05, "1": 3.425791880440783e-07}, "score": 4.008780777057469}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7781506780266049, "4": 0.22168793150367666, "3": 0.00016098216105810796, "2": 3.216879051764181e-07, "1": 9.629370325830368e-09}, "score": 4.777989083500082}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9923188013476789, "4": 0.007680010228404042, "3": 1.1969115825376379e-06, "1": 0, "2": 0}, "score": 4.992317596013637}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5654793502544128, "3": 0.42829948362504694, "2": 0.004813887544450239, "5": 0.0014024129362982707, "1": 4.812051776685618e-06}, "score": 3.5634606946737453}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7708140614024931, "5": 0.22538200869872033, "3": 0.0037929583389612965, "2": 1.079261990012585e-05, "1": 1.0864577688308387e-07}, "score": 4.221567154757503}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5651770127501513, "5": 0.43457779735721097, "3": 0.0002451402652541882, "2": 4.7380314519707255e-08, "1": 0}, "score": 4.4343325633073025}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5118641608416158, "4": 0.4878934876324957, "3": 0.0002421994494425531, "2": 1.1492041403858118e-07, "1": 0}, "score": 4.511621750561179}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5388294540085022, "5": 0.46076482829424215, "3": 0.0004052756925898875, "2": 3.8186984740323516e-07, "1": 0}, "score": 4.460358816545551}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9407966054471024, "4": 0.05918990945591305, "3": 1.3369240162382325e-05, "2": 2.5910280927391636e-08, "1": 0}, "score": 4.940783269006579}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6132112228795821, "5": 0.38532786873578845, "3": 0.0014561864224598338, "2": 4.6373290186695275e-06, "1": 1.1210969783939488e-07}, "score": 4.383862060778994}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8624403516287489, "5": 0.13522665262520137, "3": 0.002327994759940835, "2": 4.9402333057254445e-06, "1": 1.0136367952940705e-07}, "score": 4.1328884679108935}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9975151885674575, "4": 0.00248389422089101, "3": 8.505054645740311e-07, "2": 1.286404019375687e-08, "1": 0}, "score": 4.997514366042228}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996865131172844, "4": 0.0003134395623653609, "3": 1.8732160077333668e-08, "1": 0, "2": 0}, "score": 4.999686522964353}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986005046083137, "4": 0.0013992166985160681, "3": 2.550982683357121e-07, "2": 2.7747560597733185e-09, "1": 0}, "score": 4.998600264751537}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7467721652772612, "5": 0.25003906833232387, "3": 0.003182164669790453, "2": 6.360280994901081e-06, "1": 5.744602647325789e-08}, "score": 4.246844056180191}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9211971636623676, "4": 0.07866139323656518, "3": 0.00014093975900202331, "2": 4.464300999272695e-07, "1": 0}, "score": 4.921055383462238}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9787439569001414, "4": 0.021248524952945675, "3": 7.52107859576325e-06, "2": 1.8530088882121786e-08, "1": 0}, "score": 4.9787363777559515}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9918157042132306, "4": 0.00817940393176449, "3": 4.884073268929624e-06, "2": 1.71588973833598e-08, "1": 0}, "score": 4.991810776521797}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5744535717589674, "5": 0.42482392075978387, "3": 0.0007186721390492142, "2": 3.605186697788878e-06, "1": 9.498888045866757e-08}, "score": 4.424097810604565}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9483813345249571, "4": 0.05159622335333708, "3": 2.2282275860157147e-05, "2": 1.237369370823317e-07, "1": 1.666001999547255e-08}, "score": 4.948358773239686}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986391446046303, "4": 0.0013607904974070508, "3": 6.283648253889527e-08, "1": 0, "2": 0}, "score": 4.998639083826822}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.603701324024071, "4": 0.39612395461603744, "3": 0.0001744069842475969, "2": 2.524299632432859e-07, "1": 0}, "score": 4.603526449565753}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999927452391705, "4": 7.250768512480375e-05, "3": 1.1001766347430705e-08, "1": 0, "2": 0}, "score": 4.999927470309245}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9608981490190701, "4": 0.03909574271062903, "3": 6.0338456355247015e-06, "2": 1.6113458217615986e-08, "1": 0}, "score": 4.9608921389772975}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.961594185415848, "5": 0.03559617110993907, "3": 0.0028077952840972714, "2": 1.6968533375335616e-06, "1": 0}, "score": 4.032784987080742}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.997300890763142, "4": 0.0026989094364294223, "3": 1.7779635760279225e-07, "1": 0, "2": 0}, "score": 4.997300734911461}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.923802763076659, "4": 0.07615618360370939, "3": 4.0893599442917595e-05, "2": 9.763400425050704e-08, "1": 1.0265531601935942e-08}, "score": 4.9237616912825475}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999943901441583, "4": 5.606919527952959e-05, "3": 4.257183693940568e-09, "1": 0, "2": 0}, "score": 4.999943922288945}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999365112594953, "4": 6.342249174807395e-05, "3": 2.0441207459389895e-08, "1": 0, "2": 0}, "score": 4.999936536622931}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.831348082489902, "4": 0.16852211356940908, "3": 0.00012960852459672015, "2": 2.4473594087119826e-07, "1": 1.1374520805338207e-08}, "score": 4.831217899919615}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8702229202347171, "5": 0.1276189382751784, "3": 0.0021542966267563825, "2": 3.715155586694705e-06, "1": 5.2006662581769606e-08}, "score": 4.1254570650654125}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9090290655621147, "3": 0.08261186208406798, "5": 0.008189044947039219, "2": 0.00016963050269189501, "1": 3.4038534277571477e-07}, "score": 3.9252368964760422}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.823911605257496, "4": 0.17590707611359935, "3": 0.00018005449552100514, "2": 1.0571552329853022e-06, "1": 0}, "score": 4.823729606945539}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8499714655520693, "4": 0.14995993808369207, "3": 6.840032376093287e-05, "2": 2.2721616587768215e-07, "1": 0}, "score": 4.849902584299678}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7385703506530471, "4": 0.2611788910816659, "3": 0.00024974978532388596, "2": 8.939812814209376e-07, "1": 6.867442347339645e-08}, "score": 4.738318640714795}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.845924488882158, "4": 0.15403491214828371, "3": 4.0543098061135324e-05, "2": 5.952395502240912e-08, "1": 0}, "score": 4.845883823646631}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6358656754951245, "5": 0.3635582671795782, "3": 0.0005751564886616412, "2": 7.574926519545268e-07, "1": 0}, "score": 4.362981647736848}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997071254161366, "4": 0.0002927896865584621, "3": 1.3845355548643941e-08, "1": 0, "2": 0}, "score": 4.9997071826019255}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8052060351709437, "5": 0.19315621757343182, "3": 0.0016267414101143783, "2": 1.0513031238065324e-05, "1": 2.1410548988358438e-07}, "score": 4.191507861159294}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9137657786964407, "5": 0.0845423573329945, "3": 0.0016898503572052208, "2": 1.9921442236340677e-06, "1": 0}, "score": 4.082848524466028}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.986681511999392, "4": 0.01331789046381203, "3": 5.274678084992979e-07, "1": 0, "2": 0}, "score": 4.986681053667325}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9588119298683433, "4": 0.041175794805337486, "3": 1.2214643977693047e-05, "2": 1.3103348876264349e-08, "1": 0}, "score": 4.9587997346363935}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998446263017435, "4": 0.00015521706521153688, "3": 5.362384491375816e-08, "1": 0, "2": 0}, "score": 4.999844675671099}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989366754306424, "4": 0.0010628763586296777, "3": 4.0074360626779686e-07, "2": 3.850233658379996e-09, "1": 0}, "score": 4.998936310557062}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9950141422579298, "4": 0.004985218724506448, "3": 6.816803390859242e-07, "1": 0, "2": 0}, "score": 4.995013418127557}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999607083559369, "4": 3.914021902790973e-05, "3": 3.4470325964257144e-08, "1": 0, "2": 0}, "score": 4.999960790835734}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9667220192712129, "4": 0.03327310719551139, "3": 4.7744250483681745e-06, "2": 1.4239230077721839e-08, "1": 0}, "score": 4.966717298412031}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999850252451228, "4": 1.48233784276092e-05, "3": 1.5455251321398267e-08, "1": 0, "2": 0}, "score": 4.999985145709051}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998437919917416, "4": 0.00015605547577313985, "3": 4.22628663714986e-08, "1": 0, "2": 0}, "score": 4.999843859981278}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8920232693742037, "5": 0.10571113989838335, "3": 0.0022615456127583616, "2": 3.756138961868717e-06, "1": 0}, "score": 4.103442111899957}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.520813977463678, "4": 0.47828231676081395, "3": 0.0008911529358935329, "2": 1.2180320285624169e-05, "1": 1.6541357234744551e-07}, "score": 4.51989807532038}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.76538840120904, "5": 0.23348636443553833, "3": 0.0011236432175592587, "2": 1.4341080069055972e-06, "1": 0}, "score": 4.2323598894894054}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.86463179776155, "4": 0.13534547436713165, "3": 2.2652575588125152e-05, "2": 5.527859908363265e-08, "1": 0}, "score": 4.864609051935758}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9964075892032748, "4": 0.0035919286224327155, "3": 5.13359221492281e-07, "1": 0, "2": 0}, "score": 4.9964070447711695}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4995109146405645, "5": 0.4992261397582761, "3": 0.001261717993270582, "2": 1.0078461791593447e-06, "1": 0}, "score": 4.4979625155057406}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5287652010522007, "4": 0.46913598775250587, "3": 0.002092380847236921, "2": 6.225940765774461e-06, "1": 1.2950776450974447e-07}, "score": 4.526660019246724}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5879781450832683, "5": 0.41090337066464533, "3": 0.0011167045466672952, "2": 1.6043963147784764e-06, "1": 0}, "score": 4.409783529164132}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.985877580298505, "4": 0.014116104080038907, "3": 6.287638468235002e-06, "2": 2.161703879758861e-08, "1": 0}, "score": 4.985871255701965}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6416258713925757, "5": 0.3379705897023111, "3": 0.02026039264587877, "2": 0.0001405848270681889, "1": 1.650195157125839e-06}, "score": 4.317424366065656}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5303329087022112, "5": 0.46932048829331946, "3": 0.0003459676445985813, "2": 6.242143612030995e-07, "1": 2.3667974252353345e-08}, "score": 4.468973195343376}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6316896598362745, "4": 0.36813397300025136, "3": 0.0001761578658327492, "2": 2.1010488048963973e-07, "1": 1.052474169207287e-08}, "score": 4.631513043030162}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9833484072766445, "5": 0.01372144968629311, "3": 0.0029284558749666776, "2": 1.5861886417338733e-06, "1": 0}, "score": 4.010789822523529}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998186442669394, "4": 0.00018129808551899714, "3": 3.960442430709892e-08, "1": 0, "2": 0}, "score": 4.999818622702358}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995688277314909, "4": 0.00043083300600774637, "3": 2.2096666144460033e-07, "1": 0, "2": 0}, "score": 4.999568725009651}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8301300862921175, "5": 0.1638997038710502, "3": 0.005961375714262953, "2": 8.793462590508009e-06, "1": 4.092908098619277e-08}, "score": 4.157920618401866}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999643625146609, "4": 0.00035626953243382027, "3": 6.225375388788077e-08, "1": 0, "2": 0}, "score": 4.999643605944709}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5649909870990562, "5": 0.4335176363358728, "3": 0.001488442511531499, "2": 2.926981121655877e-06, "1": 5.860270388767661e-08}, "score": 4.432023141791711}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996473191865045, "4": 0.0003525926970246076, "3": 4.717578998462488e-08, "1": 0, "2": 0}, "score": 4.999647312936957}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.996171403336803, "4": 0.0038274289256400584, "3": 1.1670784304734685e-06, "1": 0, "2": 0}, "score": 4.996170236914975}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7453620764565706, "4": 0.20715373090012268, "2": 0.04262906420525114, "5": 0.004658306075683729, "1": 0.0001962482732630662}, "score": 3.173448881874827}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6216012431569227, "5": 0.37123028301481614, "3": 0.007154880984531845, "2": 1.3310225281073537e-05, "1": 1.6917519536816038e-07}, "score": 4.36404831535296}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9584523891293448, "5": 0.02907455168374457, "3": 0.012465352290890672, "2": 7.646312901290477e-06, "1": 2.9545747856900372e-08}, "score": 4.016593818644837}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9339774598195619, "5": 0.0509319373165465, "3": 0.015039059434736633, "2": 5.1192680250322916e-05, "1": 2.4533358035606926e-07}, "score": 4.0357897602933575}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6073373659370163, "5": 0.392094330151032, "3": 0.0005668495122261625, "2": 1.4126742764205748e-06, "1": 2.8823292768618343e-08}, "score": 4.3915245738718856}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8737674624475564, "4": 0.12619087971359874, "3": 4.147735260701662e-05, "2": 1.4033842639356153e-07, "1": 0}, "score": 4.873725739496272}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998936015807134, "4": 0.00010633149844495328, "3": 2.6948747921074662e-08, "1": 0, "2": 0}, "score": 4.999893614599807}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8529321734081311, "4": 0.14702019804139482, "3": 4.738139106090975e-05, "2": 4.138964947726328e-08, "1": 0}, "score": 4.852884884735692}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993084148952952, "4": 0.0006915490338317144, "3": 3.914868515013086e-08, "1": 0, "2": 0}, "score": 4.999308372670927}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996131350315575, "4": 0.0003867078730411854, "3": 6.982833248568767e-08, "1": 0, "2": 0}, "score": 4.9996131524365355}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9579178464115576, "5": 0.036173820948071374, "3": 0.005902466290945943, "2": 5.694305030673431e-06, "1": 5.791224438658268e-08}, "score": 4.030259795763947}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9713710955201185, "5": 0.015343305866046285, "3": 0.013274474477765927, "2": 1.1028607271363926e-05, "1": 4.906205065843089e-08}, "score": 4.002046627082686}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7746610268647651, "5": 0.22421790719784176, "3": 0.001120209564519637, "2": 8.194708580840552e-07, "1": 1.729625210919051e-08}, "score": 4.2230960111768185}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995763270347484, "4": 0.00042350086558074634, "3": 1.3321559581445652e-07, "1": 0, "2": 0}, "score": 4.99957623268675}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8672866881674748, "5": 0.117045409979542, "3": 0.015632972085536108, "2": 3.473809967501373e-05, "1": 1.3068120882349657e-07}, "score": 4.101342575831565}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"4": 0.957104938438443, "3": 0.02865614997626177, "5": 0.014173248494515503, "2": 6.510338585765514e-05, "1": 3.9341531575016407e-07}, "score": 3.985385709070387}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5936576040345742, "4": 0.40563310914289114, "3": 0.0007058675106857034, "2": 3.0105974816943892e-06, "1": 1.1724524321944056e-07}, "score": 4.5929455364185126}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9465896267501936, "4": 0.05337808556093829, "3": 3.2169186646950286e-05, "2": 5.943990706782637e-08, "1": 0}, "score": 4.946557394589603}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995394085348308, "4": 0.00046023469135056356, "3": 2.6505751414482426e-07, "1": 0, "2": 0}, "score": 4.999539235151362}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9037544731299756, "4": 0.09617457974923103, "3": 7.071739328302165e-05, "2": 1.6488146749858125e-07, "1": 0}, "score": 4.9036834845740565}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9753832815006931, "4": 0.024610930634389103, "3": 5.729507397247106e-06, "2": 1.2909259401497787e-08, "1": 0}, "score": 4.975377570503991}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9985266952805757, "4": 0.0014728588071992942, "3": 4.487077733301914e-07, "1": 0, "2": 0}, "score": 4.998526243781375}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9537502883982784, "4": 0.046236409816919385, "3": 1.3268191549899474e-05, "2": 1.5155383827007833e-08, "1": 0}, "score": 4.9537370074808385}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999809723900273, "4": 1.898874733064788e-05, "1": 0, "2": 0, "3": 0}, "score": 4.999981011251931}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9929100774326863, "4": 0.0070883832278949305, "3": 1.4846507478549319e-06, "2": 6.9075349460356264e-09, "1": 0}, "score": 4.9929086264091715}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6603607317601593, "5": 0.33923092799175014, "3": 0.0004073879632073166, "2": 8.488800028701282e-07, "1": 0}, "score": 4.3388218773043725}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.993282662855533, "4": 0.006716342791822049, "3": 9.171892559478819e-07, "1": 0, "2": 0}, "score": 4.9932818223112685}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5131941219643673, "5": 0.4862885193571771, "3": 0.0005168171092034746, "2": 4.514076614799449e-07, "1": 0}, "score": 4.485770843230522}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981190669758446, "4": 0.0018808211793160576, "3": 1.1526868988706646e-07, "1": 0, "2": 0}, "score": 4.998118948289745}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9142491698180839, "4": 0.08569558256838194, "3": 5.4850623716226634e-05, "2": 2.86219739844365e-07, "1": 0}, "score": 4.914193848020211}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8395272610765974, "4": 0.1602690842160946, "3": 0.0002029043240748604, "2": 7.067647290868929e-07, "1": 0}, "score": 4.839322979833077}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9717521079707839, "4": 0.028241419557602076, "3": 6.312864641759018e-06, "2": 2.4329919228207383e-08, "1": 0}, "score": 4.971745877901222}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9353345090366991, "5": 0.06290156090021119, "3": 0.0017618362322979807, "2": 1.9795084532752966e-06, "1": 2.0537425111847902e-08}, "score": 4.061135709772339}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999678603234905, "4": 3.208560727089901e-05, "3": 4.6985306724034694e-09, "1": 0, "2": 0}, "score": 4.999967904994084}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9903746966449465, "4": 0.009623820035863768, "3": 1.4479279840639914e-06, "2": 5.4231825905352616e-09, "1": 0}, "score": 4.990373267550127}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5593162071573824, "5": 0.43999645892497447, "3": 0.0006857280756519874, "2": 1.4015076610986471e-06, "1": 6.085067041935159e-08}, "score": 4.439307808315481}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986590027414597, "4": 0.001340934526847748, "3": 6.744772389044369e-08, "1": 0, "2": 0}, "score": 4.998658930584028}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6951028421833075, "5": 0.3046797359880542, "3": 0.0002173594767816757, "2": 1.0422164538262618e-07, "1": 0}, "score": 4.304462155320216}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998192401790255, "4": 0.00018065435378441692, "3": 5.636023913091361e-09, "1": 0, "2": 0}, "score": 4.999819334356131}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987763557638922, "4": 0.001223530679746921, "3": 4.199400361194419e-08, "1": 0, "2": 0}, "score": 4.998776385244681}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9810266869148413, "5": 0.01156764849506886, "3": 0.007396757873349138, "2": 8.843940700905293e-06, "1": 4.577416444843758e-08}, "score": 4.004153065488434}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997581089603562, "4": 0.00024166985470064098, "3": 1.5577066616863667e-07, "1": 0, "2": 0}, "score": 4.999758018588137}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9394951457368764, "4": 0.0604866439181657, "3": 1.809829179704576e-05, "2": 7.307175013099864e-08, "1": 0}, "score": 4.9394769379237164}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999068318704197, "4": 9.30778796180212e-05, "3": 5.284525030014799e-08, "1": 0, "2": 0}, "score": 4.999906816426396}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9985969445040008, "4": 0.0014029852375177904, "3": 9.135516636516893e-08, "1": 0, "2": 0}, "score": 4.99859683208175}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7905552201975359, "5": 0.20899060085797644, "3": 0.00045380298856353106, "2": 3.4952735827847953e-07, "1": 0}, "score": 4.208536104326006}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997152252560272, "4": 0.00028452626181322096, "3": 1.4091739067522568e-07, "1": 0, "2": 0}, "score": 4.99971519187277}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9792374230209121, "4": 0.02075183920184281, "3": 1.0692900942535879e-05, "2": 2.5819805099186337e-08, "1": 0}, "score": 4.979226697140991}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9882208231453431, "4": 0.011777626578066837, "3": 1.4196658939299687e-06, "1": 0, "2": 0}, "score": 4.98821953255149}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993680597883768, "4": 0.0006317896825351801, "3": 8.546080390297239e-08, "1": 0, "2": 0}, "score": 4.999368039354737}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8763286299951686, "5": 0.11822259892809348, "3": 0.005440109987653585, "2": 8.492815391078666e-06, "1": 6.112083686615663e-08}, "score": 4.112765332030275}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7940764561424264, "5": 0.20379960426022212, "3": 0.002114192364854723, "2": 9.575258747740214e-06, "1": 1.7092208970985128e-07}, "score": 4.201665748823686}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.999870009379513, "4": 0.0001299346404119303, "3": 2.6994680739477867e-08, "1": 0, "2": 0}, "score": 4.9998700113664585}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999088581436714, "4": 9.103277058090919e-05, "3": 5.908918052126637e-08, "1": 0, "2": 0}, "score": 4.999908849046501}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9412112136449489, "5": 0.05029863698285279, "3": 0.008453446930676522, "2": 3.6559590946279954e-05, "1": 1.7948916373584614e-07}, "score": 4.041771530872342}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8883453001969543, "4": 0.11154992839647905, "3": 0.0001040788263755603, "2": 5.515981747736587e-07, "1": 3.7213657721379155e-08}, "score": 4.888240098704473}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6810289382338468, "5": 0.3181403313467756, "3": 0.0008297799606263328, "2": 9.611147771387147e-07, "1": 2.1491807950061895e-08}, "score": 4.317308554480389}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9774070550414433, "4": 0.022563232004558013, "3": 2.950000869124703e-05, "2": 1.3950254390125103e-07, "1": 0}, "score": 4.977377347808957}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8974625863560274, "4": 0.10250786004272838, "3": 2.952293910531233e-05, "2": 4.714098709546201e-08, "1": 0}, "score": 4.897432954346288}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999888397127765, "4": 1.1093247146004685e-05, "3": 6.6463965588057134e-09, "1": 0, "2": 0}, "score": 4.99998889345939}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9834134274394957, "4": 0.016584213998806854, "3": 2.388184748638408e-06, "1": 0, "2": 0}, "score": 4.983411010123112}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8284779888001047, "4": 0.17131995309858095, "3": 0.0002014128049517644, "2": 6.263879057545705e-07, "1": 3.00838004830397e-08}, "score": 4.82827522371168}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.576548162402596, "5": 0.4232671665084507, "3": 0.00018449116164394598, "2": 1.4424869188320186e-07, "1": 0}, "score": 4.423082401944417}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9599112948379296, "4": 0.04007721542673167, "3": 1.133273633190841e-05, "2": 3.831601047658313e-08, "1": 0}, "score": 4.959899999393384}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9949073318299657, "4": 0.005091896115537002, "3": 7.921587684561833e-07, "1": 0, "2": 0}, "score": 4.9949065196693265}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"4": 0.788664555497089, "5": 0.2108651182317534, "3": 0.00046994259923772237, "2": 2.849967671714972e-07, "1": 0}, "score": 4.2103946263997045}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9502825267710963, "5": 0.04534370143222999, "3": 0.004339973660054966, "2": 3.359931090450224e-05, "1": 1.237186253707437e-07}, "score": 4.040936161069085}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6918558045536563, "4": 0.307988633780368, "3": 0.00015538339174033593, "2": 1.8789604108772788e-07, "1": 0}, "score": 4.69170003871443}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999083813732428, "4": 9.157172618811315e-05, "3": 1.4079837886861805e-08, "1": 0, "2": 0}, "score": 4.99990840011113}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997382703309112, "4": 0.0026161225504033126, "3": 1.1966183751192918e-06, "2": 1.371731408791946e-08, "1": 0}, "score": 4.997381443155683}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9897933361586473, "4": 0.010203296751315729, "3": 3.2251341876774365e-06, "2": 1.696521102403127e-08, "1": 0}, "score": 4.989790200808547}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9939675298559584, "4": 0.0060319333363721165, "3": 5.394800670561565e-07, "1": 0, "2": 0}, "score": 4.993966987719618}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6013732794460463, "5": 0.39783160350658425, "3": 0.0007944329247756251, "2": 5.955657755062783e-07, "1": 0}, "score": 4.397036014610504}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9985404733465318, "4": 0.0014593005987371568, "3": 1.6722025521545555e-07, "1": 0, "2": 0}, "score": 4.998540364874877}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.980973000717402, "4": 0.019021917728543117, "3": 5.078868791546117e-06, "2": 1.4506964391011307e-08, "1": 0}, "score": 4.980967881237973}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6543861227402349, "4": 0.34527361131300754, "3": 0.00033899303381949186, "2": 1.1290443398581993e-06, "1": 6.809091768585915e-08}, "score": 4.6540447169069745}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7720015123165639, "4": 0.22778312701626657, "3": 0.00021484214689116668, "2": 4.438048048035951e-07, "1": 3.406198104551615e-08}, "score": 4.771785711749905}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.975433310192176, "3": 0.01648289668871895, "5": 0.00807328916848839, "2": 1.0421881205272955e-05, "1": 5.308879223486376e-08}, "score": 3.991569389206658}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981831971879076, "4": 0.0018165902937434975, "3": 1.4157262509172642e-07, "1": 0, "2": 0}, "score": 4.9981831264321075}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5338322649209211, "4": 0.4658921543843176, "3": 0.00027507961310372893, "2": 4.783572493641472e-07, "1": 2.8196781407556263e-08}, "score": 4.533556141083156}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5208114358976693, "5": 0.47870346225032506, "3": 0.000483753779853579, "2": 1.2183086665127081e-06, "1": 0}, "score": 4.478217333908287}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5081691776371514, "5": 0.49149839741521384, "3": 0.00033199023570745393, "2": 3.6137233906469995e-07, "1": 0}, "score": 4.491165720456719}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6688796703361083, "5": 0.3306751187355022, "3": 0.00044492047483687226, "2": 2.571012142024986e-07, "1": 0}, "score": 4.33022969507217}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.626451701622542, "4": 0.3727921698546691, "3": 0.0007524737843659469, "2": 3.3032953395714062e-06, "1": 0}, "score": 4.625692841142918}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9314684272871526, "5": 0.06533053114351792, "3": 0.0031724303909606796, "2": 2.7967735941127038e-05, "1": 6.240015403939392e-07}, "score": 4.062100294483338}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7901907634100132, "4": 0.16056240432276708, "2": 0.04894785652670667, "5": 0.000271838613630586, "1": 2.6996994850170272e-05}, "score": 3.1121042467430176}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8314429197746133, "4": 0.1685011675725131, "3": 5.5837604488031856e-05, "2": 3.0776666969200805e-08, "1": 0}, "score": 4.831387057423726}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7375204222242718, "5": 0.26226123285538727, "3": 0.00021806726232270795, "2": 1.3270701943286162e-07, "1": 0}, "score": 4.262042938162412}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9917658736686323, "4": 0.00823322320513753, "3": 9.012050723178305e-07, "1": 0, "2": 0}, "score": 4.991764974368897}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992405694534574, "4": 0.0007592855747620711, "3": 1.366510828971002e-07, "1": 0, "2": 0}, "score": 4.9992404411167515}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9682807701060422, "4": 0.03167475777507222, "3": 4.4075829925974624e-05, "2": 2.7336170280284296e-07, "1": 3.736292254746893e-08}, "score": 4.968236118310422}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9257428395258677, "4": 0.07418600191817203, "3": 7.083077334023863e-05, "2": 2.0723529466918075e-07, "1": 3.870922086677486e-08}, "score": 4.92567155390948}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9756014308553961, "4": 0.02437153807201258, "3": 2.6754817697429012e-05, "2": 1.9044602802037152e-07, "1": 5.849830836291212e-08}, "score": 4.975574146294192}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993440144526594, "4": 0.0006554211184421255, "3": 4.722562954011834e-07, "2": 1.050328260073139e-08, "1": 0}, "score": 4.999343602805512}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9792511432125626, "4": 0.020731514434355083, "3": 1.7264796742463284e-05, "2": 8.810540104832817e-08, "1": 4.554008089326653e-08}, "score": 4.979233510660408}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8337466164428488, "5": 0.16564838495950499, "3": 0.0006044071486229779, "2": 4.4865909117783974e-07, "1": 0}, "score": 4.165043104059193}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9958195989051497, "4": 0.004178803572879376, "3": 1.5475043831261117e-06, "2": 3.847908819422382e-09, "1": 0}, "score": 4.995818089681552}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9296366017539758, "4": 0.07032254743069957, "3": 4.0689641764809965e-05, "2": 6.637595297822466e-08, "1": 0}, "score": 4.929595867483768}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9875711758442148, "4": 0.012426947237036948, "3": 1.8028965355475468e-06, "2": 8.420909482303228e-09, "1": 0}, "score": 4.987569420891702}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9965874003995409, "4": 0.0034120909288030176, "3": 4.7660060636987684e-07, "1": 0, "2": 0}, "score": 4.996586955760524}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7005056833232103, "5": 0.29888212921126733, "3": 0.0006112405361965999, "2": 8.214621292867922e-07, "1": 3.229672516301098e-08}, "score": 4.298269176650516}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9990564649394003, "4": 0.0009433438572140803, "3": 1.3361183425684741e-07, "1": 0, "2": 0}, "score": 4.999056388864774}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9791670134854389, "3": 0.012340527675912172, "5": 0.008488325755917661, "2": 4.212105148385437e-06, "1": 2.7424913084419576e-08}, "score": 3.996139292005932}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9898013980582023, "4": 0.010198027089484845, "3": 5.185963510612194e-07, "1": 0, "2": 0}, "score": 4.989800935144055}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7958364492619917, "5": 0.199462366409156, "3": 0.004689965746822405, "2": 1.0975972417135305e-05, "1": 1.4627769518150766e-07}, "score": 4.194750028645057}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8054760499131578, "5": 0.19393541261800157, "3": 0.0005882310765117714, "2": 2.8947381299516495e-07, "1": 0}, "score": 4.193346605865}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6138104265842493, "4": 0.38603410828055357, "3": 0.00015538121638807904, "2": 1.1769786054890201e-07, "1": 0}, "score": 4.613654789243465}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7824710688241717, "5": 0.21467141977113877, "3": 0.0028519166555964256, "2": 5.39246472606398e-06, "1": 5.0441933192903864e-08}, "score": 4.211808599021824}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996854406241779, "4": 0.00031441807770516496, "3": 4.2965000265576395e-08, "1": 0, "2": 0}, "score": 4.999685495961369}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989844979715279, "4": 0.0010151849158279347, "3": 2.715186520315797e-07, "1": 0, "2": 0}, "score": 4.998984272000556}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9551103704761752, "4": 0.04487562969821254, "3": 1.3845254768915005e-05, "2": 6.30481573613882e-08, "1": 0}, "score": 4.955096486538087}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5090119170671948, "4": 0.4906720485055209, "3": 0.0003156637478513781, "2": 2.960815244809132e-07, "1": 0}, "score": 4.508695699103929}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8768154517970083, "5": 0.12212371386189104, "3": 0.0010599579939419884, "2": 7.233591416616173e-07, "1": 0}, "score": 4.121062327670751}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9877254781173218, "4": 0.012272374723352953, "3": 2.0131256378807974e-06, "1": 0, "2": 0}, "score": 4.9877235973799205}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.994218579108696, "4": 0.00578088669860798, "3": 4.924474906440466e-07, "1": 0, "2": 0}, "score": 4.994218128165046}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9989828307676905, "4": 0.0010169722992455403, "3": 1.8201695406589228e-07, "1": 0, "2": 0}, "score": 4.998982663651672}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9071509635443668, "4": 0.09282166568554198, "3": 2.730537469161493e-05, "2": 1.8048594901316425e-08, "1": 0}, "score": 4.907123665021893}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9685008834032341, "4": 0.03148413534062257, "3": 1.4857986883878365e-05, "2": 1.0493004918811444e-08, "1": 0}, "score": 4.9684861136525775}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998418850414879, "4": 0.00015801951814555868, "3": 2.48161298007309e-08, "1": 0, "2": 0}, "score": 4.999841930838432}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999906712677533, "4": 9.324771535080028e-05, "3": 1.9040510423225575e-08, "1": 0, "2": 0}, "score": 4.99990671420171}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9333719101850352, "5": 0.06490900584194838, "3": 0.0017159845181743245, "2": 3.0141430410827304e-06, "1": 4.4523976282758644e-08}, "score": 4.063186862043018}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9953926624933619, "4": 0.004606794500265036, "3": 5.707782822401693e-07, "2": 1.8068081525675797e-09, "1": 0}, "score": 4.995392058659042}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8279767042139342, "4": 0.17191623957443058, "3": 0.00010686031966518468, "2": 2.2284285499841847e-07, "1": 0}, "score": 4.827869375896746}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996774601971498, "4": 0.00032245821371478016, "3": 6.312505992780328e-08, "1": 0, "2": 0}, "score": 4.999677415530209}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995506012798684, "4": 0.00044925944886041236, "3": 9.371580362226558e-08, "1": 0, "2": 0}, "score": 4.999550553099057}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9785481533126731, "4": 0.021449681118264303, "3": 2.16561970411811e-06, "2": 6.819293246543698e-09, "1": 0}, "score": 4.978545967331835}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8196504828638846, "4": 0.18028664905808056, "3": 6.274773978271875e-05, "2": 1.1072014892703143e-07, "1": 0}, "score": 4.819587521566681}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9990658695017917, "4": 0.0009340178580036124, "3": 1.1327753131597354e-07, "1": 0, "2": 0}, "score": 4.999065755587529}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995626318333539, "4": 0.0004372018806906236, "3": 1.2075392980190402e-07, "1": 0, "2": 0}, "score": 4.999562556591533}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989350084065093, "4": 0.00106482437449159, "3": 1.3626204549609021e-07, "1": 0, "2": 0}, "score": 4.998934903068445}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9875610572417848, "4": 0.012435993617667732, "3": 2.794392017678669e-06, "2": 9.395960256411053e-09, "1": 0}, "score": 4.987558387601996}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9965453707105195, "4": 0.0034539847998693697, "3": 6.407451762613619e-07, "2": 6.434504497683793e-09, "1": 0}, "score": 4.99654471441556}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8954593608767272, "4": 0.10450761911956727, "3": 3.299788795201714e-05, "2": 2.7127225021704555e-08, "1": 0}, "score": 4.8954263042469215}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999658339276736, "4": 3.4020101073453084e-05, "3": 1.3158643419333424e-08, "1": 0, "2": 0}, "score": 4.999965953577118}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9567539998704354, "4": 0.043237504527781516, "3": 8.4689840785051e-06, "2": 2.7127225021704555e-08, "1": 0}, "score": 4.956745476144426}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8968558967965788, "5": 0.095984294486217, "3": 0.007153367887219299, "2": 6.3289070414136105e-06, "1": 7.644380050585759e-08}, "score": 4.0888180426047}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.897546427636992, "5": 0.09809224181429356, "3": 0.004351279235444781, "2": 9.643378923691353e-06, "1": 1.5335727607592646e-07}, "score": 4.093721239608452}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987144018901963, "4": 0.0012851639258709372, "3": 4.30790906624901e-07, "1": 0, "2": 0}, "score": 4.998713974487953}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9762933814411586, "4": 0.02370225707840295, "3": 4.282279914054409e-06, "1": 0, "2": 0}, "score": 4.976289176483861}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7472023328124807, "4": 0.25242151759188214, "3": 0.00037434160315697953, "2": 1.3276607485165723e-06, "1": 0}, "score": 4.746825694611906}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8466057830557243, "4": 0.13658038999780772, "2": 0.01652644093118231, "5": 0.00028502091341053225, "1": 2.396483747823034e-06}, "score": 3.120619194140694}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5861569045736653, "4": 0.4133311050804874, "3": 0.0005084157701257218, "2": 3.412112353328272e-06, "1": 9.306478252560062e-08}, "score": 4.585641426027172}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6447037113329707, "5": 0.3548243857263618, "3": 0.00047110639393426504, "2": 7.361146175318923e-07, "1": 0}, "score": 4.354351828517424}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999581569766358, "4": 0.0004182634754362882, "3": 8.04676175429492e-08, "1": 0, "2": 0}, "score": 4.999581575553223}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9936698818514531, "4": 0.0063287704715151395, "3": 1.2981154488416403e-06, "2": 7.593129588675211e-09, "1": 0}, "score": 4.993668610252481}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9273495295061674, "3": 0.045206423021226225, "5": 0.02647818745078206, "2": 0.0009623291635226335, "1": 3.387948439011442e-06}, "score": 3.9793369393042384}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8873307589125997, "4": 0.11261668442091792, "3": 5.20776856195569e-05, "2": 4.485709383277247e-07, "1": 0}, "score": 4.887277811067156}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9376285786329814, "5": 0.05338114955098517, "3": 0.008965458768045916, "2": 2.4506602179540098e-05, "1": 1.5287289690377726e-07}, "score": 4.044366225773341}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9914759782510973, "4": 0.008522709263626875, "3": 1.2967285048804531e-06, "2": 8.957595547917683e-09, "1": 0}, "score": 4.991474670348611}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9689146611096157, "4": 0.031082031252616008, "3": 3.2605391266036997e-06, "2": 1.5635060132897997e-08, "1": 0}, "score": 4.968911399785791}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6710902636296505, "4": 0.32860400019667724, "3": 0.0003052971479689384, "2": 4.741505261250384e-07, "1": 2.362670965111855e-08}, "score": 4.670783907890919}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996873472660559, "4": 0.00031250549654453154, "3": 9.764630691009405e-08, "1": 0, "2": 0}, "score": 4.999687299195335}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9827393506643843, "4": 0.017246873470830173, "3": 1.3683908192284548e-05, "2": 5.628279182177175e-08, "1": 0}, "score": 4.982725589248167}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989087183813413, "4": 0.0010909105112654781, "3": 3.403599850122663e-07, "1": 0, "2": 0}, "score": 4.998908408735201}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9953496813707934, "4": 0.004647415594584888, "3": 2.8470704631778243e-06, "2": 2.378297139398772e-08, "1": 0}, "score": 4.995346818765829}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5088967152582233, "4": 0.4906096389902803, "3": 0.000492477393464778, "2": 1.0598215638510146e-06, "1": 4.730574925989473e-08}, "score": 4.508402007434203}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994382168365917, "4": 0.005615537329503901, "3": 2.325494159007732e-06, "2": 1.3370300104149336e-08, "1": 0}, "score": 4.994379771821714}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6163992082570076, "4": 0.3831867541106348, "3": 0.00041234507437874144, "2": 1.4359197116623043e-06, "1": 0}, "score": 4.61598414942831}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9822714590018212, "4": 0.01772586157228481, "3": 2.729126399940862e-06, "1": 0, "2": 0}, "score": 4.982268681056171}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992846056166711, "4": 0.0007149485327706903, "3": 4.29592393463096e-07, "1": 0, "2": 0}, "score": 4.999284192270806}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5979009943654938, "5": 0.40141480495664866, "3": 0.0006834268023002255, "2": 6.07625559975786e-07, "1": 0}, "score": 4.400730229524628}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9990871652873251, "4": 0.0009126026369350189, "3": 1.6447898922080816e-07, "1": 0, "2": 0}, "score": 4.999087068343375}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5209929338441077, "4": 0.47875978502578115, "3": 0.0002470408130415653, "2": 1.7258775589639058e-07, "1": 0}, "score": 4.520745583125295}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978184562330283, "4": 0.002181270660927377, "3": 2.441905436039861e-07, "1": 0, "2": 0}, "score": 4.997818240894899}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.800342698431797, "5": 0.19900267741528258, "3": 0.0006507623735364419, "2": 3.654888395411003e-06, "1": 8.65656284741685e-08}, "score": 4.198344369433928}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9974261124434852, "4": 0.0025736169395924953, "3": 2.2177222395763004e-07, "1": 0, "2": 0}, "score": 4.99742593939023}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9977694471883944, "4": 0.0022303383021860185, "3": 1.8068096233315285e-07, "1": 0, "2": 0}, "score": 4.997769300260429}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6006052993771833, "4": 0.3992340869655247, "3": 0.0001604230772100435, "2": 1.4889224210359063e-07, "1": 0}, "score": 4.600444603546729}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999367496503877, "4": 6.310503484997813e-05, "3": 4.576450711862308e-08, "1": 0, "2": 0}, "score": 4.999936803429845}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9730930804605479, "4": 0.02690526733050459, "3": 1.350631901286286e-06, "1": 0, "2": 0}, "score": 4.973092023290865}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7451694029059639, "5": 0.2542458923837755, "3": 0.0005841111312518731, "2": 4.1018030730730936e-07, "1": 0}, "score": 4.253661007413009}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7980170227443579, "3": 0.196980901823894, "5": 0.004184606105583261, "2": 0.0008164260656422331, "1": 9.739274721384634e-07}, "score": 3.8055679168874192}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9767691416031742, "4": 0.023226411990124936, "3": 4.4072440316204034e-06, "2": 5.290008416799817e-09, "1": 0}, "score": 4.976764756864746}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6090587294764277, "4": 0.3907526218164711, "3": 0.0001880937592572656, "2": 5.464161347143405e-07, "1": 2.8946168226854284e-08}, "score": 4.608869443616657}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7048475927758637, "5": 0.2942240579573201, "3": 0.0009195753229343031, "2": 8.376352506318666e-06, "1": 1.8785151500253956e-07}, "score": 4.293287227888851}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8547009049655269, "4": 0.14525335288077695, "3": 4.562380217978513e-05, "2": 6.257187130497647e-08, "1": 0}, "score": 4.8546552036919675}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5452440971011451, "4": 0.4544818955188074, "3": 0.00027355167890581397, "2": 3.397759184487428e-07, "1": 0}, "score": 4.544969929046164}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9801678955516268, "5": 0.015431870423884242, "3": 0.004398226005171194, "2": 1.932606399585908e-06, "1": 0}, "score": 4.011029780037703}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960405927051188, "4": 0.003958965203940304, "3": 4.7201220200004203e-07, "1": 0, "2": 0}, "score": 4.99604009089014}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9844406402820586, "4": 0.015549952422622483, "3": 9.26961232174968e-06, "2": 6.147735139266326e-08, "1": 0}, "score": 4.984431322734259}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"2": 0.9130583447436492, "3": 0.08306528617135399, "1": 0.003646335092735509, "4": 0.0002273947645499874, "5": 2.606101842545738e-06}, "score": 2.0798815615593917}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9678875140031804, "4": 0.032085437891998456, "3": 2.6719204004241264e-05, "2": 9.330921187912029e-08, "1": 0}, "score": 4.967860836200639}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9045325030197496, "4": 0.09544328330628443, "3": 2.411831614763842e-05, "2": 1.3254880668495037e-08, "1": 0}, "score": 4.904508432456639}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981722797187111, "4": 0.0018271827120337055, "3": 4.653469874802926e-07, "1": 0, "2": 0}, "score": 4.998171886461961}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9696955313142825, "4": 0.03029227952770385, "3": 1.2014767977882067e-05, "2": 3.063931036490911e-08, "1": 0}, "score": 4.969683594660404}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9979091468849978, "4": 0.002089707865600093, "3": 1.0959434143653275e-06, "2": 1.539630948618809e-08, "1": 0}, "score": 4.997908053987706}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9598340730805467, "4": 0.040146821795160305, "3": 1.8980811692927503e-05, "2": 4.3676702525138556e-08, "1": 0}, "score": 4.959815082311}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9811955910836696, "4": 0.018801882146157644, "3": 2.4918877554692897e-06, "2": 1.117729889422185e-08, "1": 0}, "score": 4.981193100100615}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999961110815618, "4": 3.8652662146174766e-06, "3": 3.347891808848763e-09, "1": 0, "2": 0}, "score": 4.999996128037922}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998634540532465, "4": 0.00013634024432553939, "3": 7.407261063731973e-08, "1": 0, "2": 0}, "score": 4.999863511592488}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7089281198709935, "4": 0.29083031263002795, "3": 0.00024126853299284682, "2": 3.224831339202092e-07, "1": 0}, "score": 4.708686189705455}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8546814009134177, "3": 0.13687910335656225, "5": 0.00805015929136689, "2": 0.0003890789027815646, "1": 9.085236595597639e-08}, "score": 3.870392603968728}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962089084018817, "4": 0.0037903913751811, "3": 7.517432456150597e-07, "1": 0, "2": 0}, "score": 4.996208105333687}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9787952375756377, "4": 0.021197049108239215, "3": 7.687161179610052e-06, "2": 2.7986152574851392e-08, "1": 0}, "score": 4.978787492649789}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999573707926505, "4": 4.260201522741374e-05, "3": 8.074620224220253e-09, "1": 0, "2": 0}, "score": 4.999957381834717}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8649927963534688, "4": 0.13498297764667783, "3": 2.4179122590882517e-05, "2": 4.868372751320625e-08, "1": 0}, "score": 4.864968518300886}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9622944346693093, "4": 0.037688359454194915, "3": 1.7094957858706034e-05, "2": 6.803041175890582e-08, "1": 0}, "score": 4.96227724492099}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9264215781114791, "4": 0.07355384175912688, "3": 2.4477701443755764e-05, "2": 3.20614969088109e-08, "1": 0}, "score": 4.926397101474321}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9976790219444912, "4": 0.0023208248910780304, "3": 1.9058815376358558e-07, "1": 0, "2": 0}, "score": 4.997678794019484}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6591895190583498, "5": 0.33995782948189684, "3": 0.000849348477030992, "2": 3.171835866542634e-06, "1": 6.357503341745902e-08}, "score": 4.33910196952177}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6538473464399154, "5": 0.3432598288758859, "3": 0.0028909089810382903, "2": 1.903290171865088e-06, "1": 0}, "score": 4.340365117539453}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9956803615924384, "4": 0.004318757646130337, "3": 8.27656188561018e-07, "1": 0, "2": 0}, "score": 4.995679586812056}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9942842146146361, "4": 0.005713142822442263, "3": 2.640231381867067e-06, "2": 6.2527529386038356e-09, "1": 0}, "score": 4.99428155797896}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999368688428554, "4": 6.303074088666067e-05, "3": 2.771206386421728e-08, "1": 0, "2": 0}, "score": 4.999936913830399}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9966927809367415, "4": 0.0033055007642007533, "3": 1.7379175010465097e-06, "1": 0, "2": 0}, "score": 4.996691023465713}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8799406825279718, "4": 0.11979940019893591, "3": 0.00025770990625724303, "2": 1.9704157438349164e-06, "1": 1.471794862614472e-07}, "score": 4.879678669221935}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9713676092755127, "3": 0.014594405626000203, "5": 0.013937956178520346, "2": 9.959824639546023e-05, "1": 4.738969234383287e-07}, "score": 3.999142932406004}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7857559507465128, "5": 0.21274196065461926, "3": 0.0014997460278140106, "2": 2.1073759711006374e-06, "1": 4.542496468953393e-08}, "score": 4.2112379036866106}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9608434447228774, "4": 0.03914060342658756, "3": 1.5739107802994107e-05, "2": 6.436016185416215e-08, "1": 0}, "score": 4.960827719464838}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8969431471820091, "5": 0.09795024826356062, "3": 0.005098909936694996, "2": 7.548142888449225e-06, "1": 1.2560220843320182e-07}, "score": 4.092835867172194}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5553945593890297, "5": 0.44358869877118684, "3": 0.0010137499518820042, "2": 2.719582995194214e-06, "1": 9.614359324971191e-08}, "score": 4.442569299186125}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9992416414692925, "4": 0.0007580607730561282, "3": 2.616754085287584e-07, "1": 0, "2": 0}, "score": 4.999241415848755}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8984150263668824, "4": 0.10149834358429592, "3": 8.645884825021653e-05, "2": 1.3654453661089387e-07, "1": 0}, "score": 4.898328325562058}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9828017536461136, "4": 0.0171947529972826, "3": 3.4444786507560456e-06, "2": 1.1308682991202311e-08, "1": 0}, "score": 4.982798323473113}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9939710697782227, "4": 0.006028078353766657, "3": 8.482096524911241e-07, "1": 0, "2": 0}, "score": 4.993970225204869}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8038826244103874, "4": 0.19597677924694495, "3": 0.00014019980138774333, "2": 2.44883071379951e-07, "1": 0}, "score": 4.803742056736938}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9912705984218071, "4": 0.008726228661549498, "3": 3.1248383628551104e-06, "2": 6.3756805414466185e-09, "1": 0}, "score": 4.9912675021705155}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8343404637587479, "4": 0.16561277438501265, "3": 4.660829632282325e-05, "2": 3.3204746645280244e-08, "1": 0}, "score": 4.834293889464514}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994616477336113, "4": 0.0005382046391271783, "3": 1.1616828086180127e-07, "1": 0, "2": 0}, "score": 4.999461563007372}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993287775306565, "4": 0.0006707067840699612, "3": 3.977902422951332e-07, "1": 0, "2": 0}, "score": 4.999328497556279}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6495633961588013, "3": 0.34819657082073635, "5": 0.0012417144913959143, "2": 0.000997798705392595, "1": 4.362148237145059e-07}, "score": 3.6510482084399456}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999820452021894, "4": 1.788046109929949e-05, "3": 2.8522887550904423e-08, "1": 0, "2": 0}, "score": 4.999982062492304}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9038162070913932, "4": 0.09615748142903734, "3": 2.6189761657540023e-05, "2": 3.359286982788075e-08, "1": 0}, "score": 4.903790029790531}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990819360787868, "4": 0.000917225688362262, "3": 7.836698617405243e-07, "1": 0, "2": 0}, "score": 4.999081206921781}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999504572972803, "4": 4.9469116113785155e-05, "3": 4.295911446372654e-08, "1": 0, "2": 0}, "score": 4.999950444964139}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9996931864469076, "4": 0.0003066581342727521, "3": 5.638486869426989e-08, "1": 0, "2": 0}, "score": 4.999693229065609}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986857439918653, "4": 0.0013139580300907951, "3": 2.279822641120333e-07, "1": 0, "2": 0}, "score": 4.998685585913377}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9157651716519091, "4": 0.0842066569243279, "3": 2.8144911035154556e-05, "2": 4.041329588736302e-08, "1": 0}, "score": 4.915736933185018}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999282867615172, "4": 7.164974232485854e-05, "3": 1.170222315435716e-08, "1": 0, "2": 0}, "score": 4.999928326849516}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998539191008537, "4": 0.0001460077288979345, "3": 1.112678024137036e-08, "1": 0, "2": 0}, "score": 4.9998539700084805}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9322126827078216, "3": 0.05119162164874789, "5": 0.016291571350019844, "2": 0.00030227541076297465, "1": 1.725715173616808e-06}, "score": 3.9644902173605754}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9384307947045417, "5": 0.03297305388541961, "3": 0.028263931288188007, "2": 0.00033057136221449884, "1": 1.3964601326742656e-06}, "score": 4.004043791512651}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.593731281514828, "4": 0.40609144936614244, "3": 0.00017704599506919338, "2": 2.1076691127205385e-07, "1": 0}, "score": 4.593553821320509}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986671948747254, "4": 0.001332714685606764, "3": 8.029287096077069e-08, "1": 0, "2": 0}, "score": 4.998667124715127}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9955729424374301, "4": 0.004426603912922817, "3": 4.787654621758678e-07, "1": 0, "2": 0}, "score": 4.995572438667354}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9166615764212938, "4": 0.08327309259984152, "3": 6.508834871237909e-05, "2": 2.054079161559724e-07, "1": 0}, "score": 4.916596111374507}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998375943892193, "4": 0.00016227518354038927, "3": 4.031698470830407e-08, "1": 0, "2": 0}, "score": 4.99983764416786}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6606599825774594, "5": 0.33551513896392127, "3": 0.0038170229219899186, "2": 7.547063581188488e-06, "1": 0}, "score": 4.331683124230072}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999191774530297, "4": 0.0008079010256124212, "3": 2.4974011494521206e-07, "1": 0, "2": 0}, "score": 4.999191599433766}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976113896804891, "4": 0.0023880033036851396, "3": 5.85469937635307e-07, "2": 4.556586811230178e-09, "1": 0}, "score": 4.997610812046088}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.965180386593293, "5": 0.03351170829061667, "3": 0.00130759657816463, "2": 2.5984436014479125e-07, "1": 0}, "score": 4.032203593591839}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9829317741415192, "4": 0.017065216669254948, "3": 2.9854233362085118e-06, "2": 8.38588417502696e-09, "1": 0}, "score": 4.982928787063864}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9100143275816194, "5": 0.08860437884168292, "3": 0.0013805711342957455, "2": 6.690593943277453e-07, "1": 0}, "score": 4.087222474244797}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997507311526429, "4": 0.00024913814902282217, "3": 1.6356442181343374e-08, "1": 0, "2": 0}, "score": 4.999750829109603}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7890257598000138, "4": 0.21094640131056314, "3": 2.7775478357350778e-05, "2": 2.8859113538330344e-08, "1": 0}, "score": 4.788997953864849}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9910642329063579, "4": 0.008931436810533884, "3": 4.25345484734002e-06, "2": 5.107268616301028e-08, "1": 0}, "score": 4.991059902831456}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.680520454021455, "5": 0.31833964504486756, "3": 0.0011392450190051454, "2": 6.245109334550046e-07, "1": 0}, "score": 4.317199160965235}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.917674166335156, "3": 0.05877660954931743, "5": 0.023462182720388657, "2": 8.658421792972846e-05, "1": 2.555987512546891e-07}, "score": 3.964511630785267}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9017848255347, "4": 0.09817460519180476, "3": 4.0444940606332895e-05, "2": 1.0497915818158997e-07, "1": 0}, "score": 4.901744188087892}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9625901450605441, "4": 0.03740519426927332, "3": 4.519753956519865e-06, "2": 2.0519011301351274e-08, "1": 0}, "score": 4.962585700161202}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7384449668230477, "5": 0.2610942306093813, "3": 0.0004603801484940485, "2": 3.9726669737603397e-07, "1": 1.6195360898634068e-08}, "score": 4.260633009675904}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9940075815905233, "4": 0.0059900854590697414, "3": 2.2430477818509043e-06, "2": 1.5417694401452898e-08, "1": 0}, "score": 4.994005381745774}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9825429875149363, "4": 0.01744702032374949, "3": 9.988965741926809e-06, "2": 1.567457286876949e-08, "1": 0}, "score": 4.98253295493902}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997923090607499, "4": 0.00020761918451159405, "3": 3.6296046988278415e-08, "1": 0, "2": 0}, "score": 4.99979230821603}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995955072092758, "4": 0.0004043897974474836, "3": 9.450217375621528e-08, "1": 0, "2": 0}, "score": 4.99959542119477}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9998692942427418, "4": 0.0001305867240253477, "3": 3.942971961650944e-08, "1": 0, "2": 0}, "score": 4.999869334406134}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7938059365612106, "5": 0.2031876586728407, "3": 0.0029937664561053424, "2": 1.225270290507366e-05, "1": 1.4119513036245523e-07}, "score": 4.200169012149203}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9929890611096576, "4": 0.007008686294441373, "3": 2.1854539359218234e-06, "2": 6.520139927272669e-09, "1": 0}, "score": 4.992986922812121}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998914561513098, "4": 0.00010843994939473, "3": 1.9182297278046534e-08, "1": 0, "2": 0}, "score": 4.999891521676821}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998421234138201, "4": 0.00015778818904141768, "3": 2.6489431362821158e-08, "1": 0, "2": 0}, "score": 4.999842158822324}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"4": 0.949878576278687, "5": 0.0299960371813547, "3": 0.019973323914736104, "2": 0.00015100750808020553, "1": 1.0590682985366694e-06}, "score": 4.009717521007167}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9639126022962579, "3": 0.018233312514932026, "5": 0.017776521663658878, "2": 7.72906938235025e-05, "1": 2.5368411135311175e-07}, "score": 3.999387866697026}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8573799069106199, "5": 0.1418768714494983, "3": 0.0007424166124937354, "2": 6.950576814037219e-07, "1": 0}, "score": 4.141133080242005}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987900219145083, "4": 0.0012098441854750809, "3": 1.3425632380152148e-07, "1": 0, "2": 0}, "score": 4.998789887302308}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9902483279445916, "4": 0.00975107054999961, "3": 5.834418776707229e-07, "1": 0, "2": 0}, "score": 4.990247762390085}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7365839238591971, "4": 0.26319220400801363, "3": 0.0002225230202304245, "2": 1.129762640453726e-06, "1": 5.985002423580933e-08}, "score": 4.736359079212807}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6422851853404749, "5": 0.3551659620563266, "3": 0.0025044177665098253, "2": 4.359775062979056e-05, "1": 7.515966699737545e-07}, "score": 4.352572124139723}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8704310589332842, "4": 0.12951924485044577, "3": 4.944720614876229e-05, "2": 2.437404274109089e-07, "1": 0}, "score": 4.870381128832924}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994247334992588, "4": 0.0005751949103983555, "3": 2.7374114400491945e-08, "1": 0, "2": 0}, "score": 4.999424750315937}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9910160004704484, "4": 0.008982886605926815, "3": 9.986594572954623e-07, "1": 0, "2": 0}, "score": 4.9910151150485085}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9958130953281684, "4": 0.004185772517836885, "3": 1.1742862990231916e-06, "1": 0, "2": 0}, "score": 4.995811879086021}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8026080751190672, "4": 0.19732897878058486, "3": 6.27232102123072e-05, "2": 4.714108137753041e-08, "1": 0}, "score": 4.802545398673288}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8875448044673168, "4": 0.11237794271166991, "3": 7.703505345695742e-05, "2": 1.1804888719687273e-07, "1": 0}, "score": 4.887467621813176}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9463522404836358, "4": 0.0536347017329871, "3": 1.2954426675561483e-05, "2": 3.6014291181537416e-08, "1": 0}, "score": 4.946339277757145}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9983199264063862, "4": 0.0016794952116044061, "3": 5.567586468450197e-07, "1": 0, "2": 0}, "score": 4.998319391234761}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9051384984770149, "4": 0.09480574218346553, "3": 5.558245300239189e-05, "2": 5.127579646014369e-08, "1": 0}, "score": 4.905082927160538}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998453414008744, "4": 0.00015448678488649798, "3": 7.188523125958243e-08, "1": 0, "2": 0}, "score": 4.9998453694292}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.781966913057583, "4": 0.2179057171241774, "3": 0.0001272317921501856, "2": 1.7608147903035392e-07, "1": 0}, "score": 4.781839299349276}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998998773362203, "4": 0.0010010704515068147, "3": 9.857580409756634e-08, "1": 0, "2": 0}, "score": 4.998998732339202}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997087511348253, "4": 0.0029116160741732215, "3": 8.735329380107026e-07, "1": 0, "2": 0}, "score": 4.9970866368627345}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9997994598108725, "4": 0.00020041126054256935, "3": 4.396319633398429e-08, "1": 0, "2": 0}, "score": 4.99979950079603}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8994949408588259, "4": 0.10038779930252052, "3": 0.00011653079326658687, "2": 6.303730814878243e-07, "1": 6.991147766291434e-08}, "score": 4.899376965451789}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9692443467990787, "3": 0.01738849323249247, "5": 0.013337967652348461, "2": 2.8791913255234466e-05, "1": 1.939607534796715e-07}, "score": 3.995891307862878}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986486532923785, "4": 0.001351074063855578, "3": 2.880343768129266e-07, "1": 0, "2": 0}, "score": 4.998648349888193}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9919251313250896, "4": 0.008072642523924457, "3": 2.1124650969614507e-06, "2": 1.5544483812528327e-08, "1": 0}, "score": 4.99192308511975}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6752459055053444, "5": 0.3233882710894691, "3": 0.0013627998258034578, "2": 2.8365954787068765e-06, "1": 9.167950346062936e-08}, "score": 4.322019553724078}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998542766686762, "4": 0.00014563865060170287, "3": 1.3561851804560399e-08, "1": 0, "2": 0}, "score": 4.9998543342153345}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8184649707265143, "4": 0.1814482481673255, "3": 8.665641595972214e-05, "2": 1.8796989874395434e-07, "1": 0}, "score": 4.818377886584051}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998905030816723, "4": 0.001094879464341135, "3": 4.954081310100538e-08, "1": 0, "2": 0}, "score": 4.998905021410039}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989710563259455, "4": 0.0010287946548638554, "3": 1.415271875721841e-07, "1": 0, "2": 0}, "score": 4.998970922283051}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5375688414850569, "4": 0.23374308362994375, "2": 0.22414632584864405, "5": 0.0036512014542605343, "1": 0.0008902439781970021}, "score": 3.0151186773235166}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9036060996714453, "4": 0.09634512328355244, "3": 4.835881675252291e-05, "2": 2.8534581678930327e-07, "1": 0}, "score": 4.90355729022995}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9822653630440624, "4": 0.017732582720319974, "3": 2.032600602143091e-06, "1": 0, "2": 0}, "score": 4.982263351694743}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999619003488102, "4": 3.806322366993828e-05, "3": 7.829008212786847e-09, "1": 0, "2": 0}, "score": 4.999961921117225}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9640264760177861, "4": 0.03596953315827704, "3": 3.912707376204074e-06, "2": 8.98333179053143e-09, "1": 0}, "score": 4.964022611989742}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9906170333430588, "4": 0.009381023563584901, "3": 1.8542541838041459e-06, "2": 6.2329755612009775e-09, "1": 0}, "score": 4.990615248453882}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986227389956558, "4": 0.0013769009411306753, "3": 2.9639020222259646e-07, "1": 0, "2": 0}, "score": 4.998622506190755}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.769351428283252, "5": 0.22922363039530058, "3": 0.0014237338308519187, "2": 1.1371652672236514e-06, "1": 2.0565313315591334e-08}, "score": 4.227797571873184}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997745552364907, "4": 0.00022533621099119064, "3": 2.423320589238709e-08, "1": 0, "2": 0}, "score": 4.9997746153035925}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999753699393249, "4": 2.458797636896429e-05, "3": 1.908311355528719e-08, "1": 0, "2": 0}, "score": 4.999975373856838}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9726745828122166, "4": 0.0273086166059293, "3": 1.6700999333543156e-05, "2": 3.359407919296304e-08, "1": 0}, "score": 4.972657878808902}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9558391530825413, "4": 0.04411800514151187, "3": 4.261854801647561e-05, "2": 9.723627456371903e-08, "1": 0}, "score": 4.955796460484354}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.925748660615144, "5": 0.05543088220598037, "3": 0.018798823328774, "2": 2.1336549858945394e-05, "1": 2.528268423824788e-07}, "score": 4.036588628924182}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5952049077199625, "5": 0.4003554105520202, "3": 0.0044292788322246425, "2": 9.907415904326041e-06, "1": 0}, "score": 4.395906513051701}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8208794774510935, "5": 0.1742786541684855, "3": 0.004838396087763829, "2": 3.402629645956637e-06, "1": 3.9984258411581904e-08}, "score": 4.169433337897224}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8896500818738632, "4": 0.11030869779822966, "3": 4.103705988077684e-05, "2": 1.2794453336866492e-07, "1": 0}, "score": 4.889608838141184}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998570179529074, "4": 0.00014295652427194177, "3": 8.60553703142659e-09, "1": 0, "2": 0}, "score": 4.9998570262622355}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7145197573500877, "5": 0.2851350076005332, "3": 0.00034488863160097156, "2": 1.856263601516493e-07, "1": 0}, "score": 4.284789793507966}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999167249015635, "4": 8.311769022481797e-05, "3": 8.214416693794472e-08, "1": 0, "2": 0}, "score": 4.999916718015173}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998042270160321, "4": 0.00019564925835248702, "3": 3.6267094296442255e-08, "1": 0, "2": 0}, "score": 4.999804278190341}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.739555832014277, "5": 0.25940161012668356, "3": 0.001041182388088386, "2": 1.3513290071852056e-06, "1": 2.0122223216124485e-08}, "score": 4.2583576657524365}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9373396235356964, "4": 0.0626318089336419, "3": 2.847474511090934e-05, "2": 6.135329248453136e-08, "1": 0}, "score": 4.937311055545804}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5233921955811668, "4": 0.47640132510891553, "3": 0.00020633056310982338, "2": 1.5374983552752973e-07, "1": 0}, "score": 4.523185554900874}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999236381607137, "4": 7.62429199425758e-05, "3": 1.3097492988205129e-08, "1": 0, "2": 0}, "score": 4.999923730877001}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.996184187983779, "4": 0.003814514054299347, "3": 1.3197476683240949e-06, "2": 6.747484960084798e-09, "1": 0}, "score": 4.996182826316825}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8731234885965347, "4": 0.126818823205934, "3": 5.7634166368276534e-05, "2": 3.8112138871749423e-08, "1": 0}, "score": 4.873065792104245}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996339731841657, "4": 0.00036574777553868723, "3": 2.048321446087429e-07, "1": 0, "2": 0}, "score": 4.999633842533}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6166119889972055, "5": 0.3828251199317662, "3": 0.0005626067298099828, "2": 2.836343296706301e-07, "1": 0}, "score": 4.3822619462035135}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997491818801253, "4": 0.00025065952845406325, "3": 1.1443315311824022e-07, "1": 0, "2": 0}, "score": 4.999749111594162}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999691715222073, "4": 3.073476910741619e-05, "3": 1.1431947370838159e-08, "1": 0, "2": 0}, "score": 4.999969242364467}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7480391595787423, "5": 0.2507137572435976, "3": 0.0012445640139432238, "2": 2.3497514531939366e-06, "1": 3.358134944938761e-08}, "score": 4.2494644268676804}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998415274880953, "4": 0.00015825751656925886, "3": 9.472148387721396e-08, "1": 0, "2": 0}, "score": 4.999841553021406}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9782476873137063, "4": 0.021749389300055735, "3": 2.9061176745062957e-06, "1": 0, "2": 0}, "score": 4.978244798088915}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971730918511699, "4": 0.0028260050718827093, "3": 9.093843544127594e-07, "1": 0, "2": 0}, "score": 4.997172176177244}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9985454653623985, "4": 0.001454014394483409, "3": 4.51776160458848e-07, "1": 0, "2": 0}, "score": 4.998545081953581}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6711705845187078, "5": 0.3237284279509904, "3": 0.005073178676223447, "2": 2.7250300755959022e-05, "1": 3.1936410182975434e-07}, "score": 4.318599866786603}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9696650445660322, "4": 0.030326996183107916, "3": 7.872199937282149e-06, "2": 1.772797387571115e-08, "1": 0}, "score": 4.969657204129644}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9872257690510978, "4": 0.012772229950813294, "3": 1.9876748886497725e-06, "2": 2.582791619282784e-09, "1": 0}, "score": 4.9872237868138125}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999899125338788, "4": 9.955036041626229e-06, "3": 4.135920174896135e-09, "1": 0, "2": 0}, "score": 4.999990036690839}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995622743898207, "4": 0.00043759794628522473, "3": 1.1745506523930351e-07, "1": 0, "2": 0}, "score": 4.999562167139114}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.923110267685509, "3": 0.051258890645453165, "5": 0.02550586125736406, "2": 0.00012453833223624374, "1": 3.4938757529362855e-07}, "score": 3.9739968433744317}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997123652048218, "4": 0.0002874677149093531, "3": 1.146239576473756e-07, "1": 0, "2": 0}, "score": 4.999712303022084}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.964897063771118, "4": 0.0350915787131027, "3": 1.133457238391037e-05, "2": 1.7531299687550122e-08, "1": 0}, "score": 4.96488569935819}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996376671184192, "4": 0.0003621927606052679, "3": 6.933978481678618e-08, "1": 0, "2": 0}, "score": 4.999637668534178}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9849826472207515, "4": 0.015014762427745345, "3": 2.544839435827962e-06, "2": 6.601545821231876e-09, "1": 0}, "score": 4.984980127504314}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9303271504645332, "4": 0.06964623055738223, "3": 2.6491013385864284e-05, "2": 4.060344182163233e-08, "1": 0}, "score": 4.930300659516499}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.99948141775028, "4": 0.0005184867941259735, "3": 3.1735338429810035e-08, "1": 0, "2": 0}, "score": 4.999481449702155}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5862221885033958, "5": 0.41343232572681543, "3": 0.0003452881403808125, "2": 1.7308448656689928e-07, "1": 0}, "score": 4.413086701556642}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999447358231209, "4": 5.5226922341600085e-05, "3": 8.597795532295455e-09, "1": 0, "2": 0}, "score": 4.999944755880484}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7909462385177283, "4": 0.20865095393841634, "3": 0.0003994667600897187, "2": 3.0459765565247287e-06, "1": 8.356826451423679e-08}, "score": 4.790540596092693}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9179482210843167, "5": 0.07847746229017057, "3": 0.0035711225244325646, "2": 3.113531330168294e-06, "1": 3.2005182312279256e-08}, "score": 4.074900020325018}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9921975632740823, "4": 0.0078012648357762195, "3": 1.1862778618073654e-06, "1": 0, "2": 0}, "score": 4.992196362720777}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7827048513237461, "3": 0.21676015786294578, "5": 0.000404164412967168, "2": 0.00013067346240405522, "1": 1.0425104003107457e-07}, "score": 3.783382336325651}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9733187805397022, "4": 0.0266771896217263, "3": 3.966422512023462e-06, "2": 1.1952504487307463e-08, "1": 0}, "score": 4.9733148403024225}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9946216275152518, "4": 0.005377736598117139, "3": 5.746503891138312e-07, "1": 0, "2": 0}, "score": 4.994621113771722}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8824818296662224, "4": 0.11741302878734698, "3": 0.00010458901823899686, "2": 4.94353988730118e-07, "1": 2.9758530695242348e-08}, "score": 4.8823761877377265}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9327185033186761, "4": 0.0672223027738201, "3": 5.8849866072735045e-05, "2": 2.3280142499391028e-07, "1": 1.2120858808845184e-08}, "score": 4.932659243931566}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.678763105250963, "5": 0.32059808884711943, "3": 0.0006378264714103913, "2": 8.489980053915114e-07, "1": 0}, "score": 4.319958606112699}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912109742972848, "4": 0.008787834123318, "3": 1.1023525280259251e-06, "1": 0, "2": 0}, "score": 4.991209960387319}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9349033537586376, "4": 0.06507145533774875, "3": 2.499516879427295e-05, "2": 6.850137629378488e-08, "1": 0}, "score": 4.934878340534881}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9423352085376884, "3": 0.05496590472866963, "5": 0.0026742321140822197, "2": 2.458684534806501e-05, "1": 2.9155886683281666e-08}, "score": 3.947659064205737}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9165101527704634, "5": 0.07753299432466706, "3": 0.005919156046273073, "2": 3.712221427575787e-05, "1": 4.6755820186440853e-07}, "score": 4.071538198835985}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7056494461511421, "4": 0.29422805943171826, "3": 0.00012235046102491748, "2": 1.0475097189010978e-07, "1": 0}, "score": 4.705526913848456}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9633113277218405, "4": 0.03668631433029554, "3": 2.2672339357262355e-06, "2": 7.8407683779102e-09, "1": 0}, "score": 4.963309124638839}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9999723899261651, "5": 2.401218855676349e-05, "3": 3.0689778490405074e-06, "2": 1.8341600732307653e-07, "1": 0}, "score": 4.000020576385802}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5391734824639539, "5": 0.46003564655063717, "3": 0.0007889317837355474, "2": 1.7539380217760878e-06, "1": 0}, "score": 4.459243291971947}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7704659633148293, "5": 0.22887542936703317, "3": 0.0006580387748708591, "2": 4.5228559920649854e-07, "1": 0}, "score": 4.228216512552883}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6954947264737568, "5": 0.304004918022859, "3": 0.0004998962405385565, "2": 4.007776709220571e-07, "1": 0}, "score": 4.303504237977476}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995013036503816, "4": 0.0004984977909332415, "3": 8.501688101483248e-08, "1": 0, "2": 0}, "score": 4.999501332118685}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9886169156930509, "4": 0.011381546081246792, "3": 1.4121036712829004e-06, "1": 0, "2": 0}, "score": 4.988615628275591}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9636387676040622, "5": 0.02474879693093493, "3": 0.01160200559144909, "2": 1.0239262115320734e-05, "1": 8.50212169863305e-08}, "score": 4.013126059137588}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9839806054821397, "4": 0.01599522562035384, "3": 2.3962630586216356e-05, "2": 1.287193994276421e-07, "1": 1.7836480689908828e-08}, "score": 4.983956390656371}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8127051291470997, "4": 0.18697013140348848, "3": 0.0003236586975544961, "2": 9.558928612475878e-07, "1": 4.863798631107692e-08}, "score": 4.812379474670248}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8613366001595941, "4": 0.13853768451549905, "3": 0.00012506862141144836, "2": 5.340090770017849e-07, "1": 0}, "score": 4.861210560573652}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976240882569266, "4": 0.00237467023394783, "3": 1.2310968967613294e-06, "2": 7.942140608297724e-09, "1": 0}, "score": 4.997622843739965}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6618905956971294, "5": 0.3349145681928944, "3": 0.003182489267140955, "2": 1.192071398560103e-05, "1": 2.101996591617246e-07}, "score": 4.331707678524176}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9948117656217886, "4": 0.005187527978469301, "3": 7.28109782486574e-07, "1": 0, "2": 0}, "score": 4.9948110159146175}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9138244114449007, "3": 0.08419666218735034, "5": 0.0019239613794327305, "2": 5.4838941777545786e-05, "1": 6.435398357518634e-08}, "score": 3.917617423164185}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999434246564451, "4": 5.648265263302381e-05, "3": 1.597996638783569e-08, "1": 0, "2": 0}, "score": 4.999943485383098}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9766707692995041, "4": 0.023323643276660776, "3": 5.538427180222143e-06, "2": 5.8120813583654813e-08, "1": 0}, "score": 4.976665105719449}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7849743397111912, "5": 0.2085496576319176, "3": 0.006464471616186071, "2": 1.133931122551574e-05, "1": 9.470614023969408e-08}, "score": 4.202062242879613}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.880048156246278, "4": 0.11988309732366878, "3": 6.852862614945033e-05, "2": 1.498377192743347e-07, "1": 0}, "score": 4.879979387753531}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9981535055723129, "4": 0.001845548049130074, "3": 9.54897339642999e-07, "2": 3.1166472882719826e-09, "1": 0}, "score": 4.998152532827745}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996587550872944, "4": 0.0003411342715404599, "3": 2.1260839021888793e-08, "1": 0, "2": 0}, "score": 4.999658823176287}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994754607188552, "4": 0.0005243603600438767, "3": 1.506053496450544e-07, "1": 0, "2": 0}, "score": 4.999475338414401}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7022814004046917, "4": 0.2970160503669714, "3": 0.0007018906045894441, "2": 6.601696430694841e-07, "1": 0}, "score": 4.701578188376249}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9874584154798799, "4": 0.012534906581654627, "3": 6.5482416155434615e-06, "2": 8.698128059604531e-09, "1": 0}, "score": 4.987451969322435}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9951958082236633, "4": 0.004800493758521631, "3": 3.6750383131752803e-06, "2": 1.027584337130629e-08, "1": 0}, "score": 4.995192125276243}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9785968979673102, "4": 0.021401218913535164, "3": 1.8689963171220247e-06, "1": 0, "2": 0}, "score": 4.9785950427915315}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7496448184680116, "4": 0.25030292365734036, "3": 5.2184241271741234e-05, "2": 5.354545058808124e-08, "1": 0}, "score": 4.749592542193597}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8039068055634123, "4": 0.19595463512205666, "3": 0.00013810352125641232, "2": 3.550284179895824e-07, "1": 0}, "score": 4.803768072976895}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996225448341318, "4": 0.00037723772460405015, "3": 1.3169700098771458e-07, "1": 0, "2": 0}, "score": 4.999622498849026}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8643215889482352, "5": 0.1343874947818397, "3": 0.001289788019603879, "2": 1.014701578530823e-06, "1": 3.022292785850021e-08}, "score": 4.133095597780594}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967605189782099, "4": 0.0032384427416929924, "3": 9.746767104097308e-07, "2": 4.854984149437029e-09, "1": 0}, "score": 4.996759593149565}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9676955893256157, "4": 0.03229462730162882, "3": 9.723980566706515e-06, "2": 2.392736629011755e-08, "1": 0}, "score": 4.967685851809122}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7276850485594928, "4": 0.2712328234009429, "3": 0.0010801034018233448, "2": 2.014652165595223e-06, "1": 4.343570665995011e-08}, "score": 4.726600761241326}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9676920166000952, "3": 0.016880004892066525, "5": 0.01541615952359039, "2": 1.1767030058633767e-05, "1": 5.485689234785421e-08}, "score": 3.9985124560050473}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8690573851945094, "5": 0.12910907361267177, "3": 0.0018320286027450068, "2": 1.3687673057379669e-06, "1": 3.0055655219825604e-08}, "score": 4.127274231787972}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8307799671446606, "4": 0.16898130356024993, "3": 0.00023841779073289086, "2": 2.830948036986542e-07, "1": 0}, "score": 4.830541006759619}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7912638513669055, "5": 0.20391961640936018, "3": 0.004800690582800598, "2": 1.54746709956136e-05, "1": 9.274667362345959e-08}, "score": 4.199087752839041}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7628506327255414, "3": 0.23223464908152547, "5": 0.003891087879148462, "2": 0.0010224501748373807, "1": 1.0724776773720064e-06}, "score": 3.7696082962106527}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8085649008714432, "5": 0.19009032976158904, "3": 0.0013440000495683062, "2": 6.541926218707253e-07, "1": 1.859654548666405e-08}, "score": 4.188744983756361}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8040240719621023, "4": 0.19583002801414778, "3": 0.00014557152665703357, "2": 1.3131904718664225e-07, "1": 0}, "score": 4.803878396304522}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9901053751226071, "4": 0.009892642301714674, "3": 1.9193806540097753e-06, "1": 0, "2": 0}, "score": 4.990103518311568}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.97791615471277, "4": 0.022080155831767086, "3": 3.6325706219424133e-06, "1": 0, "2": 0}, "score": 4.9779125777705495}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9605834583716333, "4": 0.03940954630583313, "3": 6.9064762472502235e-06, "2": 1.7746385066349016e-08, "1": 0}, "score": 4.960576584699516}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9964880674117291, "4": 0.003511515388709116, "3": 4.483216022078784e-07, "1": 0, "2": 0}, "score": 4.996487588077399}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993349646341101, "4": 0.0006648926226801221, "3": 6.751399008668131e-08, "1": 0, "2": 0}, "score": 4.999334972299311}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9836442813311371, "4": 0.016349875440270077, "3": 5.797260961345534e-06, "2": 1.8225283565923038e-08, "1": 0}, "score": 4.983638474908049}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997629951400903, "4": 0.00023680370712222487, "3": 6.68275778188438e-08, "1": 0, "2": 0}, "score": 4.999763062605895}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8175714822272926, "4": 0.1819873135689508, "3": 0.0004405037938613691, "2": 6.669304962390558e-07, "1": 0}, "score": 4.8171296719294485}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9180239586086304, "3": 0.07371997391643215, "5": 0.0077507117587127345, "2": 0.0005043500436078325, "1": 7.995442173082855e-07}, "score": 3.9330196253158554}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9918460790342842, "4": 0.008153375220304012, "3": 5.206358416210562e-07, "1": 0, "2": 0}, "score": 4.99184558330326}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9847693230832016, "4": 0.015224224540253574, "3": 6.439369025853804e-06, "2": 8.393585951274078e-09, "1": 0}, "score": 4.9847628714706325}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8136113044385326, "5": 0.18520336266434223, "3": 0.0011771130571081258, "2": 7.785153776119404e-06, "1": 1.6682507976851734e-07}, "score": 4.184010228113636}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9164792064111152, "5": 0.06855329548156608, "3": 0.014902608712199564, "2": 6.421421206747178e-05, "1": 6.157757388545417e-07}, "score": 4.053520414197519}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.918048167219608, "5": 0.07813095889330253, "3": 0.0037931479916195206, "2": 2.695431936952293e-05, "1": 5.995796563476182e-07}, "score": 4.0742821163002345}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8011344045879503, "4": 0.19881502681811314, "3": 5.045720533774601e-05, "2": 5.312532989143398e-08, "1": 0}, "score": 4.80108388780572}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951232067598902, "4": 0.004875856000988881, "3": 9.837274106194156e-07, "1": 0, "2": 0}, "score": 4.995122176770952}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9777354955251383, "4": 0.02225826229940858, "3": 6.162413840196873e-06, "2": 3.993211298664503e-08, "1": 0}, "score": 4.977729292189541}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9554446383112695, "3": 0.0269392081911543, "5": 0.01744967945226726, "2": 0.00016582989896615742, "1": 5.320374262421435e-07}, "score": 3.9901772142496803}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9963355206523667, "4": 0.0036641917500891143, "3": 2.8396651802881965e-07, "1": 0, "2": 0}, "score": 4.9963352403035675}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8891089478185441, "4": 0.11086448271367305, "3": 2.649217901609696e-05, "2": 8.347522130225939e-08, "1": 0}, "score": 4.889082283188818}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999237573566181, "4": 7.614044214701925e-05, "3": 4.1931437207404154e-08, "1": 0, "2": 0}, "score": 4.999923775690384}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984908043828212, "4": 0.001509013278045823, "3": 1.8527956321436152e-07, "1": 0, "2": 0}, "score": 4.998490616167265}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7996793693210609, "4": 0.2002463340635483, "3": 7.41596764188729e-05, "2": 1.3726726117274702e-07, "1": 0}, "score": 4.7996049348476175}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9543562810811456, "4": 0.04560823439164656, "3": 3.535156128920421e-05, "2": 1.0050021199967548e-07, "1": 0}, "score": 4.95432075950213}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5097423892484962, "5": 0.489772392938552, "3": 0.0004837462817281019, "2": 1.3005686058605794e-06, "1": 6.510451078761524e-08}, "score": 4.489285902000959}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99947522239396, "4": 0.0005246212417628676, "3": 1.2773040565729434e-07, "1": 0, "2": 0}, "score": 4.999475123282396}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999515300767047, "4": 4.8363604512371636e-05, "3": 2.948347205300032e-08, "1": 0, "2": 0}, "score": 4.999951577424824}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9512617573383463, "4": 0.04872543041850133, "3": 1.2637765056873069e-05, "2": 2.8418514078611846e-08, "1": 0}, "score": 4.951249201675322}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9765244388445765, "4": 0.02346851132444224, "3": 6.982901778513719e-06, "2": 1.201644149907711e-08, "1": 0}, "score": 4.976517485533186}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9746977344479397, "4": 0.0252991722797314, "3": 2.9611880556610475e-06, "1": 0, "2": 0}, "score": 4.974694902001751}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994286613061452, "4": 0.0005710530188453356, "3": 2.126706738271146e-07, "1": 0, "2": 0}, "score": 4.9994285215980865}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9213564247813881, "4": 0.07859490527751523, "3": 4.858790142118223e-05, "2": 7.066503081887148e-08, "1": 0}, "score": 4.921307706029453}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6488932627366442, "5": 0.34824695850999554, "3": 0.0028579022565694574, "2": 1.8489659889919275e-06, "1": 0}, "score": 4.3453853678301835}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9389354973982036, "4": 0.06104128746961992, "3": 2.3016366687274055e-05, "2": 7.563792697473927e-08, "1": 0}, "score": 4.938912445361663}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.885966548263588, "4": 0.11399575136616366, "3": 3.7589267016738454e-05, "2": 3.8117436827252005e-08, "1": 0}, "score": 4.885928947421926}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952492976540251, "4": 0.004749518663833528, "3": 1.226482796309166e-06, "1": 0, "2": 0}, "score": 4.995248028573961}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8476091987034977, "5": 0.15180774412585604, "3": 0.0005822218484271783, "2": 8.336284812202183e-07, "1": 0}, "score": 4.1512238552766005}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9329414263584626, "5": 0.0637027593146974, "3": 0.003349383432782829, "2": 6.241237986426611e-06, "1": 7.909509296008132e-08}, "score": 4.060340662791987}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.840569912447662, "4": 0.15938462065455622, "3": 4.5252710004927206e-05, "2": 1.6253702743411636e-07, "1": 0}, "score": 4.840524378077317}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5635625212587115, "4": 0.4361257324617362, "3": 0.00031138327782195314, "2": 2.84621104239765e-07, "1": 0}, "score": 4.563250612886618}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998996803423534, "4": 0.00010024142816719027, "3": 1.9333490225286533e-08, "1": 0, "2": 0}, "score": 4.999899719898946}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9414349378993144, "5": 0.05719113929647838, "3": 0.0013718616403357497, "2": 1.9793877069424467e-06, "1": 0}, "score": 4.055815323445091}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5307190095624474, "4": 0.4691822468414339, "3": 9.853310252501846e-05, "2": 9.974359437803264e-08, "1": 0}, "score": 4.530620335738935}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.95984418018655, "4": 0.040142646742800096, "3": 1.3080604466079368e-05, "2": 2.074924451184999e-08, "1": 0}, "score": 4.959831126919745}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9230509459103335, "4": 0.07693979854502934, "3": 9.214354667051147e-06, "2": 1.5593229863465985e-08, "1": 0}, "score": 4.923041723996066}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9680409827985144, "4": 0.03195663984101653, "3": 2.337800565216382e-06, "1": 0, "2": 0}, "score": 4.968038683293466}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9842168029473993, "4": 0.015779131548944822, "3": 4.0279580409774e-06, "2": 1.5134998402844832e-08, "1": 0}, "score": 4.984212766776175}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5289304659988324, "4": 0.4707420968540164, "3": 0.00032726314039009045, "2": 1.7446878392297036e-07, "1": 0}, "score": 4.528602853676648}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.96719484066096, "4": 0.03279716500834389, "3": 7.893751980128564e-06, "2": 3.5816684665477464e-08, "1": 0}, "score": 4.967186937912602}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7087422561974038, "4": 0.29109700990327264, "3": 0.00016037239152640498, "2": 4.104872369545525e-07, "1": 0}, "score": 4.708581028125502}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999433054571963, "4": 5.6622676959523554e-05, "3": 2.4495487819106144e-09, "1": 0, "2": 0}, "score": 4.999943372420012}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997227329856052, "4": 0.00027713951896677475, "3": 1.8345050983378854e-08, "1": 0, "2": 0}, "score": 4.999722823760677}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7119116516717475, "4": 0.28336476188996734, "2": 0.004437174406746906, "5": 0.00028440991436681415, "1": 1.945536078701699e-06}, "score": 3.279492532053789}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5455581172339331, "5": 0.45387018860902356, "3": 0.0005706006386072466, "2": 9.950269646542455e-07, "1": 0}, "score": 4.453297642562438}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9339697676128794, "3": 0.06398730337941197, "5": 0.0020055264181324806, "2": 3.7231290789441066e-05, "1": 4.8338668815509194e-08}, "score": 3.937943607810674}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5030293050714781, "4": 0.49655852366810854, "3": 0.00041147470910132654, "2": 5.899989970283737e-07, "1": 0}, "score": 4.502616703919355}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8378645302341404, "5": 0.1341865879767066, "3": 0.02792945255013499, "2": 1.915235257526037e-05, "1": 0}, "score": 4.106218860131984}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5202324750019693, "4": 0.47139049124142546, "2": 0.007896841575660596, "5": 0.00047585137018631444, "1": 4.207621644292116e-06}, "score": 3.4644369990208013}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9966270591883166, "4": 0.0033718227684347932, "3": 1.150873889795618e-06, "2": 6.66190738002318e-09, "1": 0}, "score": 4.996625855631316}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7675909844747238, "4": 0.23201190360264026, "3": 0.0003963963355004842, "2": 7.371326312187526e-07, "1": 2.2423417501199694e-08}, "score": 4.767193012871066}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991258425983903, "4": 0.0008739634521020172, "3": 2.0027748639856257e-07, "1": 0, "2": 0}, "score": 4.999125635998458}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990830079943711, "4": 0.0009167176860605404, "3": 1.9014022703024764e-07, "1": 0, "2": 0}, "score": 4.999082901956285}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9703788128595658, "3": 0.023826358765197023, "5": 0.005778971230166716, "2": 1.578574879429868e-05, "1": 3.351033293011179e-08}, "score": 3.9819209397514395}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9949906521418376, "4": 0.005007722790755676, "3": 1.6286412169892857e-06, "2": 1.3059735055748966e-08, "1": 0}, "score": 4.994988980830956}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9695227188499856, "5": 0.02578182223272313, "3": 0.004692353547031138, "2": 3.0125610313000673e-06, "1": 2.5350433663858057e-08}, "score": 4.021083368934588}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991402427032805, "4": 0.000859474845503106, "3": 2.8991588725066527e-07, "1": 0, "2": 0}, "score": 4.999139945329142}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9845502879720147, "4": 0.015444381480471165, "3": 5.216640216388175e-06, "2": 1.6062893123109455e-08, "1": 0}, "score": 4.984545135538244}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8468125917737223, "4": 0.15302992323698703, "3": 0.00015623848001028136, "2": 1.0687380479100851e-06, "1": 6.757917253258687e-08}, "score": 4.846654106374658}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.928258805351596, "5": 0.06978958446830227, "3": 0.0019492628568559707, "2": 2.282669423657024e-06, "1": 1.447538813043295e-08}, "score": 4.067835716250325}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9130200801832997, "4": 0.0869396568851415, "3": 4.016092700714373e-05, "2": 7.861824812633972e-08, "1": 0}, "score": 4.91297978337102}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977919982300636, "4": 0.002207542882177199, "3": 4.2032105542870414e-07, "1": 0, "2": 0}, "score": 4.9977916163905425}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9172137195787297, "5": 0.06844368422149524, "3": 0.014210323094640216, "2": 0.00013138337263357149, "1": 7.524381773830414e-07}, "score": 4.053968344476603}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9505246991143999, "4": 0.04946656461293123, "3": 8.693134341506892e-06, "2": 2.5965944095478964e-08, "1": 0}, "score": 4.950515970370795}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997537105042387, "4": 0.00024618555936898494, "3": 2.9061661663557703e-08, "1": 0, "2": 0}, "score": 4.999753756298871}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6044146922864727, "4": 0.39532324775458344, "3": 0.00026186223843196674, "2": 1.8142091649254387e-07, "1": 0}, "score": 4.604152477053649}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998518929489324, "4": 0.000148053479721731, "3": 4.362982298493859e-09, "1": 0, "2": 0}, "score": 4.999851937787028}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9916407742612934, "4": 0.008358494097409835, "3": 6.47070230773686e-07, "1": 0, "2": 0}, "score": 4.991640211055133}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9000266949879372, "4": 0.09991477563601223, "3": 5.825326008267578e-05, "2": 2.3107973796313438e-07, "1": 2.521043098745537e-08}, "score": 4.899967921779668}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8865285133728127, "4": 0.11305502860502076, "3": 0.0004113858401623516, "2": 4.922126034323021e-06, "1": 1.1903098494954618e-07}, "score": 4.886106953679082}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8333323306622321, "5": 0.1657360527104454, "3": 0.0009303874924934066, "2": 1.0516333826156113e-06, "1": 2.1664843617276483e-08}, "score": 4.164803522639077}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995581040647816, "4": 0.00044174206922939567, "3": 1.0886187065981982e-07, "1": 0, "2": 0}, "score": 4.99955804018714}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999629731405111, "4": 3.688247691726752e-05, "3": 1.7436292972076463e-08, "1": 0, "2": 0}, "score": 4.99996308264581}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9991660623194697, "4": 0.0008337970754662852, "3": 1.1594620539483561e-07, "1": 0, "2": 0}, "score": 4.999165971011557}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9823060856633311, "5": 0.014930218986351383, "3": 0.002762286500532524, "2": 1.3844633033936908e-06, "1": 0}, "score": 4.012165163855878}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9219847782980031, "4": 0.0779941854955502, "3": 2.0993619494560187e-05, "2": 2.5732732945226883e-08, "1": 0}, "score": 4.921963748752022}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999670259236568, "4": 3.288739843033155e-05, "3": 2.1842635942819978e-08, "1": 0, "2": 0}, "score": 4.999967068914163}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999633307373339, "4": 3.663139127680815e-05, "3": 1.4170067778727082e-08, "1": 0, "2": 0}, "score": 4.999963340267718}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8533478658744771, "3": 0.14594995354149723, "5": 0.0004558036195917682, "2": 0.0002459274461212743, "1": 2.3381070545808253e-07}, "score": 3.8540132622632863}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8961313730925925, "4": 0.10381351649634678, "3": 5.496318282851589e-05, "2": 1.6651557306130813e-07, "1": 0}, "score": 4.896076059595694}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987038210665149, "4": 0.001295603071439935, "3": 5.45951332385141e-07, "2": 1.4016648994402277e-08, "1": 0}, "score": 4.998703262955338}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987076233389405, "4": 0.0012922048933641827, "3": 1.560957868281046e-07, "1": 0, "2": 0}, "score": 4.9987074828948055}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9727969724275953, "4": 0.027199608477318896, "3": 3.3297411157902417e-06, "2": 2.324604097633899e-08, "1": 0}, "score": 4.972793660503771}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9916459367566022, "4": 0.008351699732972818, "3": 2.2647300258922176e-06, "2": 6.441393102242537e-09, "1": 0}, "score": 4.991643750711189}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9394709446536336, "5": 0.04145562503890748, "3": 0.018947069560853427, "2": 0.00012563194463528115, "1": 7.298994879671724e-07}, "score": 4.022255101865894}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9976026079456001, "4": 0.002396701169130123, "3": 6.910905360370872e-07, "1": 0, "2": 0}, "score": 4.997601916650289}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8942784777042933, "4": 0.1055509398939828, "3": 0.0001695172273542719, "2": 8.722279819660705e-07, "1": 4.032061340021651e-08}, "score": 4.894107231522944}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7944915251179644, "5": 0.20148750690277803, "3": 0.004010295297903663, "2": 1.0278029491676268e-05, "1": 1.6302227321239097e-07}, "score": 4.197456212215773}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5083625829675904, "4": 0.4780509319358069, "2": 0.011683426264918315, "5": 0.0018881807115045922, "1": 1.4771602062067347e-05}, "score": 3.470114373965472}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8221302265617149, "4": 0.1775470206637416, "3": 0.00031705224085968963, "2": 5.132498398933924e-06, "1": 3.114780396250647e-07}, "score": 4.821802185729244}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9264542128127812, "4": 0.07350831131798893, "3": 3.731944699578234e-05, "2": 8.763249152094541e-08, "1": 0}, "score": 4.926416781828774}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996471999885653, "4": 0.0003526094455754912, "3": 8.585817756786027e-08, "1": 0, "2": 0}, "score": 4.9996472188011305}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7404840907315108, "4": 0.2578013633729886, "3": 0.001698795174608191, "2": 1.537175228623842e-05, "1": 2.9921124739254785e-07}, "score": 4.738753713339633}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9841575657049798, "4": 0.015839998298718475, "3": 2.3820740504592334e-06, "1": 0, "2": 0}, "score": 4.984155236698794}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9785483774002258, "4": 0.021450378244228876, "3": 1.1818140139086588e-06, "1": 0, "2": 0}, "score": 4.978547256786056}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9794327132055325, "4": 0.020564499809752362, "3": 2.7902370544156708e-06, "1": 0, "2": 0}, "score": 4.979429919783039}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999922088635248, "4": 7.778476255583074e-05, "3": 8.991384462874231e-09, "1": 0, "2": 0}, "score": 4.999922197245525}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997012861838587, "4": 0.00029858616703617546, "3": 4.418515340954546e-08, "1": 0, "2": 0}, "score": 4.999701325437728}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9687174101654412, "3": 0.024811840505782477, "5": 0.006427812505089491, "2": 4.275411969884853e-05, "1": 8.698083760202946e-08}, "score": 3.98153020104941}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9680045648137453, "5": 0.016240908560011463, "3": 0.015464255731459445, "2": 0.0002879001037436737, "1": 2.1581007618072625e-06}, "score": 4.0001943783601215}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9097030567373393, "4": 0.09027470315991354, "3": 2.214279270945843e-05, "2": 4.244991188191679e-08, "1": 0}, "score": 4.909680878950014}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9980069761149135, "4": 0.0019926529248632694, "3": 3.067588202185708e-07, "1": 0, "2": 0}, "score": 4.998006733429525}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9991987945366396, "4": 0.0008010618483152792, "3": 8.598981310296792e-08, "1": 0, "2": 0}, "score": 4.999198766125888}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8992978471338343, "5": 0.09481946156693292, "3": 0.005869676836880246, "2": 1.2670976433830933e-05, "1": 2.2825874613039565e-07}, "score": 4.088923768247382}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7068425778800675, "4": 0.29292543219004163, "3": 0.0002312956027343263, "2": 6.267381544792859e-07, "1": 0}, "score": 4.706610076560095}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8055337321183788, "4": 0.19407402898511716, "3": 0.0003907645317401515, "2": 1.234817959454972e-06, "1": 0}, "score": 4.805140690819599}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988257038260017, "4": 0.001174140368985417, "3": 1.237339674314777e-07, "1": 0, "2": 0}, "score": 4.998825612125417}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9019382096319332, "4": 0.09797614973322488, "3": 8.540046604356825e-05, "2": 1.9356915464080444e-07, "1": 0}, "score": 4.901852464053585}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8232977727112099, "3": 0.17617946781396368, "5": 0.0004451425455558525, "2": 7.753237243362875e-05, "1": 4.207079678574658e-08}, "score": 3.8241104763014855}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9886652646912365, "4": 0.011333126422941748, "3": 1.566582598324642e-06, "2": 3.4555437897456374e-09, "1": 0}, "score": 4.988663729604843}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9999796611748367, "4": 2.0312877772834955e-05, "3": 4.757516731006758e-09, "1": 0, "2": 0}, "score": 4.999979677606763}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995961029883677, "4": 0.000403763398031111, "3": 3.735268650909218e-08, "1": 0, "2": 0}, "score": 4.999596161857722}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9954003419773767, "4": 0.0045989052175383046, "3": 7.367486851445242e-07, "2": 5.112481163424616e-09, "1": 0}, "score": 4.995399605897301}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7940908211154488, "4": 0.17869761558906191, "2": 0.026985532228016192, "5": 0.00021846232148820254, "1": 7.538871919016971e-06}, "score": 3.1521339348050432}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5893034928729335, "4": 0.3824700230109244, "2": 0.027550902094976272, "5": 0.0006600556554893943, "1": 1.5238567624753175e-05}, "score": 3.3562088576078923}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9806539675949695, "5": 0.009823247584854904, "3": 0.009515917083089452, "2": 6.796321826454431e-06, "1": 0}, "score": 4.0002937378790895}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967900212336198, "4": 0.003206161024735734, "3": 3.852940249373237e-06, "2": 2.2726822547243485e-08, "1": 0}, "score": 4.9967860651004665}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8760690823718877, "3": 0.09147646069149357, "5": 0.028432995352648077, "2": 0.004013618802934171, "1": 7.698669779020735e-06}, "score": 3.9289061908005305}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8365275870163611, "4": 0.16339248321018918, "3": 7.958109446851988e-05, "2": 2.700680156114266e-07, "1": 0}, "score": 4.83644753153981}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6762650865087831, "4": 0.3231254632709273, "3": 0.0006073079283901427, "2": 2.0278752255318494e-06, "1": 4.236543582353611e-08}, "score": 4.675653644415316}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9411496698558847, "5": 0.037070321095039355, "3": 0.02176232097997021, "2": 1.7479461409938364e-05, "1": 1.326077916981252e-07}, "score": 4.015272644529594}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975856428599039, "4": 0.0024142381680728074, "3": 1.2371874908943084e-07, "1": 0, "2": 0}, "score": 4.9975855144058885}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6158041896044636, "5": 0.3816831556571344, "3": 0.0025023589800276845, "2": 9.793202846719256e-06, "1": 0}, "score": 4.379161400821071}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8766957746559887, "5": 0.12221493769321058, "3": 0.0010875526308375854, "2": 1.6780787838139513e-06, "1": 1.905637777624314e-08}, "score": 4.121123976324429}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.99948141775028, "4": 0.0005184095453488253, "3": 8.979756300818355e-08, "1": 0, "2": 0}, "score": 4.99948141081653}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8208382703356326, "4": 0.17906806392952657, "3": 9.346570316787767e-05, "2": 1.937603017119968e-07, "1": 0}, "score": 4.820744422259055}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999952483661937, "4": 4.7430574763769536e-05, "3": 3.135073892405371e-08, "1": 0, "2": 0}, "score": 4.999952506721175}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989712908843771, "4": 0.0010282125218483867, "3": 4.847206942696442e-07, "1": 0, "2": 0}, "score": 4.998970818024543}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9664976971558142, "4": 0.03346303775123558, "3": 3.902188169782838e-05, "2": 1.936221998560385e-07, "1": 0}, "score": 4.96645833595547}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9850133003576933, "4": 0.014982566307177175, "3": 4.042945691981453e-06, "2": 5.984991010156543e-09, "1": 0}, "score": 4.985009328581187}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9839155094465778, "4": 0.01608174180324978, "3": 2.747995008548796e-06, "1": 0, "2": 0}, "score": 4.983912762194585}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998625005539155, "4": 0.00013736251939438192, "3": 3.3118294609968007e-08, "1": 0, "2": 0}, "score": 4.99986257122975}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999458085984071, "4": 5.410997545081969e-05, "3": 2.3147779012534442e-08, "1": 0, "2": 0}, "score": 4.999945843725834}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7413692683209906, "5": 0.257692903380864, "3": 0.0009367394337916969, "2": 9.9866944393997e-07, "1": 0}, "score": 4.256754189766106}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9939822602657103, "4": 0.006017394022570877, "3": 3.0464550956883745e-07, "1": 0, "2": 0}, "score": 4.993981996439273}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9504284177400667, "4": 0.04956912593740058, "3": 2.4265380189452575e-06, "1": 0, "2": 0}, "score": 4.950426019510025}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991313138264846, "4": 0.0008685738015633845, "3": 9.73526387199916e-08, "1": 0, "2": 0}, "score": 4.999131231480112}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9275534853663459, "4": 0.07243838069194311, "3": 8.14819603997678e-06, "2": 2.080942141805878e-08, "1": 0}, "score": 4.927545263028248}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9169699840787038, "5": 0.043875745758317077, "3": 0.038937503209792126, "2": 0.00021551479424240634, "1": 1.1777390697843336e-06}, "score": 4.0045036800779945}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9005338543630594, "5": 0.0951749882662153, "3": 0.004280341426600004, "2": 1.0644843089798914e-05, "1": 1.1381790388416584e-07}, "score": 4.0908730209052155}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9992927020831809, "4": 0.0007065615076280029, "3": 6.802047371832251e-07, "1": 2.591958438811584e-08, "2": 1.8062335109522456e-08}, "score": 4.9992919202089}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9959766129969272, "4": 0.0040223780360196795, "3": 9.441299701824042e-07, "2": 1.6628828353697795e-08, "1": 0}, "score": 4.995975683623549}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990143587637392, "4": 0.0009826227358875625, "3": 2.612222934702052e-06, "2": 1.9515572643287242e-07, "1": 1.489010270050268e-07}, "score": 4.999010971685418}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8347818381043532, "5": 0.12063825974707315, "3": 0.04232790575174654, "2": 0.002236469885934594, "1": 1.531782308542638e-05}, "score": 4.073791476153582}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8180670806966918, "4": 0.1817880919880144, "3": 0.00014394259265402095, "2": 8.674517033907481e-07, "1": 4.403975888570877e-08}, "score": 4.817921249186567}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.963774943237334, "5": 0.024342115029117498, "3": 0.011858124909236442, "2": 2.457116394363287e-05, "1": 1.4294212627040973e-07}, "score": 4.012434420242857}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9959777965166396, "4": 0.004021624313001783, "3": 5.815202743437728e-07, "2": 4.281360517262926e-09, "1": 0}, "score": 4.995977199829045}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5538279500195219, "4": 0.445653711569327, "3": 0.0005164944576772024, "2": 1.7446344648214708e-06, "1": 3.567199178192962e-08}, "score": 4.553307894493337}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8783235019177086, "5": 0.11209117234973909, "3": 0.009535286435032432, "2": 4.971205991858496e-05, "1": 2.846461519990238e-07}, "score": 4.1024556122201465}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6048610359374911, "3": 0.36910011772305534, "2": 0.019262867499950962, "5": 0.006741323556288961, "1": 3.4308068438905155e-05}, "score": 3.5990124073991985}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.760727505111083, "4": 0.23897527124450038, "3": 0.00029544495971698537, "2": 1.5580118572286083e-06, "1": 1.1559790542883641e-07}, "score": 4.76042867723593}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995155827379468, "4": 0.0004840004120040342, "3": 2.9850892651142464e-07, "2": 1.1131654838574968e-08, "1": 0}, "score": 4.999515369123222}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7659409047986732, "5": 0.17854396599429725, "3": 0.05043166638065023, "2": 0.005031893119361773, "1": 5.0841378374616134e-05}, "score": 4.117896075106888}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6647572583511518, "4": 0.3349451137943718, "3": 0.0002967092069418949, "2": 8.724033174110681e-07, "1": 3.400844366751854e-08}, "score": 4.664458710442411}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.924215984681818, "5": 0.07236216493179246, "3": 0.003417037607192921, "2": 4.603295950787266e-06, "1": 0}, "score": 4.068935935173622}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6777778226174924, "5": 0.32193780637400654, "3": 0.000284146104393042, "2": 2.6202052409840094e-07, "1": 0}, "score": 4.321653124289954}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9895589927201169, "4": 0.0104404812588407, "3": 4.5270868400307645e-07, "1": 0, "2": 0}, "score": 4.989558612558309}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9784907386841956, "4": 0.021507533712361016, "3": 1.7631457259914513e-06, "1": 0, "2": 0}, "score": 4.978488940760738}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9726398492230364, "4": 0.027340211822564933, "3": 1.979353873569317e-05, "2": 8.713623704989468e-08, "1": 0}, "score": 4.972619938095558}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9871307304395335, "4": 0.012863209744315969, "3": 5.983008636804056e-06, "1": 0, "2": 0}, "score": 4.9871248232495}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7108675879975, "5": 0.28876657967692043, "3": 0.00036562841494546005, "2": 1.6279924841566853e-07, "1": 0}, "score": 4.288400637520027}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999871708812939, "4": 1.2730982098759549e-05, "3": 4.707353389065586e-09, "1": 0, "2": 0}, "score": 4.999987259602004}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9991060905253342, "4": 0.0008937227088274103, "3": 1.4900156912740394e-07, "1": 0, "2": 0}, "score": 4.9991059792542725}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6585904694946184, "5": 0.3398627565735568, "3": 0.0015407200606247402, "2": 6.021735808037667e-06, "1": 8.655351013448583e-08}, "score": 4.338309714970609}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8307363606486478, "4": 0.1691230030668611, "3": 0.00013994263070732125, "2": 6.823794196510711e-07, "1": 0}, "score": 4.830595062623532}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9811711566741113, "5": 0.009697079706367963, "3": 0.00912712983658188, "2": 4.657619859839392e-06, "1": 0}, "score": 4.000560634616702}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999972151525776, "4": 2.774582998151596e-05, "3": 1.462818046176503e-08, "1": 0, "2": 0}, "score": 4.999972224911212}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9986623213907058, "4": 0.0013375544095287854, "3": 1.4095643019916723e-07, "1": 0, "2": 0}, "score": 4.998662163700029}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8689460226263057, "3": 0.1210278735496142, "5": 0.009608902177870377, "2": 0.00041596393340800317, "1": 1.1144650989987638e-06}, "score": 3.887745743531064}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9302822632624357, "4": 0.06971050884887493, "3": 6.98827369521864e-06, "1": 0, "2": 0}, "score": 4.930275497896698}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7475753770038863, "3": 0.24973862700696192, "5": 0.0024864042213909913, "2": 0.00019950584975181573, "1": 1.0144957093584417e-07}, "score": 3.752348465012627}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970883434181285, "4": 0.0029114635094881634, "3": 2.0887475980033247e-07, "1": 0, "2": 0}, "score": 4.9970881187870075}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.76634879264505, "5": 0.22998906837334843, "3": 0.003642285171302597, "2": 1.95707980134766e-05, "1": 2.7577183442202964e-07}, "score": 4.22630681592908}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5940443078864119, "5": 0.40467441854804576, "3": 0.0012794543256905264, "2": 1.5580585982854358e-06, "1": 0}, "score": 4.403391953463576}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9839704479027778, "4": 0.016010469931992635, "3": 1.8937679427880634e-05, "2": 7.327986198315173e-08, "1": 0}, "score": 4.983951433726813}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5029672602333917, "4": 0.4936342601835014, "3": 0.003384205879476441, "2": 1.3317854225643491e-05, "1": 0}, "score": 4.499556896146626}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9450304554672816, "4": 0.054732439579884266, "3": 0.00023568438492610046, "2": 1.1304689628067522e-06, "1": 0}, "score": 4.94479278422782}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7416944596994219, "5": 0.24009264723134563, "3": 0.018140387008242224, "2": 7.173763877846523e-05, "1": 5.809820358126311e-07}, "score": 4.221807083574998}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8855068819195571, "5": 0.06413439984224983, "3": 0.05012916021457231, "2": 0.00022810329120426768, "1": 1.4215666782371768e-06}, "score": 4.013544768794456}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8259544931645179, "4": 0.1736351014330494, "3": 0.0004079426325260255, "2": 2.2044379048457364e-06, "1": 8.707831071489777e-08}, "score": 4.825542021798369}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8217547714541215, "4": 0.1779021142313739, "3": 0.0003425133235988772, "2": 5.021605237215848e-07, "1": 3.7156541419668425e-08}, "score": 4.821411192999433}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7323979977542736, "4": 0.266631106366499, "3": 0.0009649748684706592, "2": 5.525758692933612e-06, "1": 1.4693889747721e-07}, "score": 4.731421712173366}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.995675038400751, "4": 0.004323391998433011, "3": 1.6127657429908933e-06, "2": 1.2734156060603265e-08, "1": 0}, "score": 4.99567334450947}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8643466287073662, "3": 0.13174123780450084, "5": 0.003022592113527767, "2": 0.0008887851746186596, "1": 6.807579684926104e-07}, "score": 3.8695017318408316}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9353918655073246, "5": 0.05306187996356476, "3": 0.011498507898355683, "2": 4.703201584340539e-05, "1": 3.8742444027705116e-07}, "score": 4.041468159328188}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6237444935071658, "4": 0.3759880003741647, "3": 0.0002668662397000656, "2": 5.851802017317303e-07, "1": 1.6740749498134376e-08}, "score": 4.623476430350743}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8637421605544232, "5": 0.13393108531728287, "3": 0.0023174009533815975, "2": 9.15134220832738e-06, "1": 1.3813518912144463e-07}, "score": 4.1315949756561885}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998632156758288, "4": 0.00013669300308491106, "3": 2.4024732893698423e-08, "1": 0, "2": 0}, "score": 4.999863258938247}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8971102506971645, "5": 0.09355745868913645, "3": 0.009287328823091578, "2": 4.441035033678412e-05, "1": 2.6630461878094793e-07}, "score": 4.084180534254386}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9911928204345349, "4": 0.008803021184474638, "3": 4.084092534939328e-06, "2": 3.708475011313322e-08, "1": 0}, "score": 4.991188699048392}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8000662277925419, "4": 0.19990958293109787, "3": 2.4148217261260082e-05, "2": 2.6466924912759118e-08, "1": 0}, "score": 4.800042038315784}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997882569807182, "4": 0.00021162282397944732, "3": 3.2306415634057837e-08, "1": 0, "2": 0}, "score": 4.999788312544585}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997293301033053, "4": 0.002706126506382976, "3": 5.25271271596206e-07, "1": 0, "2": 0}, "score": 4.997292822823324}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7475557982611474, "3": 0.23554492956666398, "5": 0.011883013923013244, "2": 0.005010840567572141, "1": 5.288753357892619e-06}, "score": 3.7663005068306656}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8256805034374449, "4": 0.1738349488104106, "3": 0.0004808498494005844, "2": 3.400452659693135e-06, "1": 1.402242373957044e-07}, "score": 4.825192561751612}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7678067308832774, "5": 0.20383421237117094, "3": 0.02826040699570057, "2": 9.826919080785486e-05, "1": 1.244151350068001e-07}, "score": 4.175376938670184}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9821353049870238, "4": 0.017842862690307895, "3": 2.1243555057664754e-05, "2": 4.557903007406538e-07, "1": 7.259999383739729e-08}, "score": 4.98211299134873}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8888942272661489, "5": 0.07978697567018475, "3": 0.03090841506356192, "2": 0.00040891551011390683, "1": 1.306821114425013e-06}, "score": 4.04805681679623}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7915029124570955, "5": 0.20430207920407414, "3": 0.0041703575643539815, "2": 2.4259288087363236e-05, "1": 4.077808252079241e-07}, "score": 4.200081976460847}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6607393920727834, "5": 0.3369728889788083, "3": 0.002263552040926515, "2": 2.3562136969610966e-05, "1": 4.089965975037289e-07}, "score": 4.334661051192054}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9556168220817928, "5": 0.04103373277261287, "3": 0.0033460156473295584, "2": 3.442942755807841e-06, "1": 2.087077462231716e-08}, "score": 4.037680767334421}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9548188064200827, "4": 0.04517009618128916, "3": 1.0956353956426609e-05, "2": 3.575534744897174e-08, "1": 0}, "score": 4.954807879086507}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9793647870052461, "4": 0.020633597193255512, "3": 1.5843552749184113e-06, "2": 5.109767156559437e-09, "1": 0}, "score": 4.979363218223393}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9462520034314612, "5": 0.034919844536880955, "3": 0.018777504401523645, "2": 5.032880403127818e-05, "1": 2.8528418874894475e-07}, "score": 4.016040827212769}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999915813694369, "4": 8.386670145457929e-06, "3": 2.7704086515303794e-09, "1": 0, "2": 0}, "score": 4.999991607788791}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8853509933012041, "5": 0.11285166745216199, "3": 0.0017953451345664138, "2": 1.7487872679501575e-06, "1": 0}, "score": 4.111052851987079}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989312015723395, "4": 0.0010687206500841033, "3": 7.349415189114808e-08, "1": 0, "2": 0}, "score": 4.998931132357033}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990025803539824, "4": 0.0009973218715837765, "3": 6.081885383948306e-08, "1": 0, "2": 0}, "score": 4.999002556453847}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9510219117077728, "5": 0.04533710893732774, "3": 0.003637431420983943, "2": 3.367573845578589e-06, "1": 0}, "score": 4.041692949888396}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7825161874067564, "4": 0.21739804434253537, "3": 8.569869157328661e-05, "2": 3.215030176976472e-08, "1": 0}, "score": 4.782430453684389}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6249920995785184, "4": 0.374870655941042, "3": 0.00013717693075435114, "2": 5.543154505045251e-08, "1": 0}, "score": 4.624854819356752}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9922642104304962, "4": 0.007734979850019475, "3": 7.10839621569588e-07, "1": 0, "2": 0}, "score": 4.992263597705763}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995582232321059, "4": 0.00044159547936455215, "3": 9.181749317608899e-08, "1": 0, "2": 0}, "score": 4.999558220846123}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8355537001016181, "5": 0.16224104784329246, "3": 0.0022004425054558577, "2": 4.40686943179844e-06, "1": 0}, "score": 4.160031856040633}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6324586348283314, "5": 0.3666154134991738, "3": 0.0009227867409954174, "2": 3.155006505525519e-06, "1": 0}, "score": 4.365686320374602}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9726505580467283, "4": 0.02734676879150913, "3": 2.5352964118630964e-06, "1": 0, "2": 0}, "score": 4.972648156844796}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9744801038702512, "4": 0.025510725688914646, "3": 9.099582723984663e-06, "2": 4.5886586302861864e-08, "1": 0}, "score": 4.974470936848379}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7978076984168837, "4": 0.2017654893116857, "3": 0.00042107247055946936, "2": 5.488453698216106e-06, "1": 1.6141647673221223e-07}, "score": 4.797375236498008}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9763500881601433, "3": 0.0178300329339498, "5": 0.005804893559522259, "2": 1.4853262795219198e-05, "1": 2.1214710593141394e-08}, "score": 3.9879450891193353}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9559738938422394, "4": 0.04401897887478944, "3": 7.148185569257121e-06, "2": 6.907997766381304e-09, "1": 0}, "score": 4.955966705254672}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.501433942548361, "5": 0.4982211620693897, "3": 0.00034448052510787535, "2": 3.8399588521578106e-07, "1": 0}, "score": 4.497875928917588}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999590395729012, "4": 4.088221216122531e-05, "3": 9.733551521490935e-09, "1": 0, "2": 0}, "score": 4.999959098317935}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9979358532869436, "4": 0.0020640663201983355, "3": 1.0924672287370249e-07, "1": 0, "2": 0}, "score": 4.99793571524592}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9978892066640683, "4": 0.002110305616583601, "3": 5.026805289199064e-07, "1": 0, "2": 0}, "score": 4.997888689053946}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9273864387519309, "5": 0.06874483998608909, "3": 0.0038629698505537992, "2": 5.679621299938307e-06, "1": 5.798154886668697e-08}, "score": 4.064870337844056}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9890176373497374, "4": 0.010977818961696808, "3": 4.486175504125032e-06, "2": 1.5725157791101192e-08, "1": 0}, "score": 4.989013161052704}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9391366905757511, "4": 0.06084093764842448, "3": 2.2124831122074494e-05, "2": 8.290387772203709e-08, "1": 0}, "score": 4.93911455399}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999960112362533, "4": 3.984877075517232e-05, "3": 7.3852726663457834e-09, "1": 0, "2": 0}, "score": 4.999960136457444}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6496274982374788, "4": 0.3464389036990385, "2": 0.003500613640490925, "5": 0.0004323073778204201, "1": 6.794718715620825e-07}, "score": 3.343801545036142}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9954092046633163, "4": 0.0045900759876644276, "3": 6.755119426389988e-07, "1": 0, "2": 0}, "score": 4.995408572787175}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5439730357449356, "4": 0.45564875974061453, "3": 0.00037760495553896704, "2": 5.355481688161733e-07, "1": 0}, "score": 4.54359439448894}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979411954514522, "4": 0.0020585687895381126, "3": 1.7598395690709364e-07, "1": 0, "2": 0}, "score": 4.997941079119476}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996634024416733, "4": 0.00033653648156537603, "3": 2.8009922907465895e-08, "1": 0, "2": 0}, "score": 4.999663407487458}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7696385961235234, "4": 0.23003198833781505, "3": 0.00032845786273575235, "2": 6.554007213871815e-07, "1": 6.819053941325396e-08}, "score": 4.76930880297112}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5140782951154148, "5": 0.48097936981196593, "3": 0.004926011227764748, "2": 1.571817298571982e-05, "1": 3.7153119720080345e-07}, "score": 4.476020919100495}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9776704293930106, "5": 0.012885611212896851, "3": 0.009438685088491912, "2": 5.13632610308978e-06, "1": 0}, "score": 4.003436653946387}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6679641330005281, "4": 0.33169586473153967, "3": 0.00033906365342321307, "2": 5.15481201856537e-07, "1": 0}, "score": 4.667624320878788}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9769962150500807, "4": 0.022995031686907627, "3": 8.66179137973077e-06, "2": 1.8416110219479957e-08, "1": 0}, "score": 4.97698758780082}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"4": 0.873011980385637, "5": 0.11968484291997762, "3": 0.007280643702568022, "2": 2.2329720700612307e-05, "1": 1.1423729692567061e-07}, "score": 4.112359207067887}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6788795570500362, "4": 0.32042318619656407, "3": 0.0006929565216945941, "2": 3.8669827738647195e-06, "1": 1.7209658104870767e-07}, "score": 4.678178527380967}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9802381055321195, "4": 0.019759418800996867, "3": 2.4780366121191137e-06, "2": 7.090584923619556e-09, "1": 0}, "score": 4.980235604041002}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999101692710216, "4": 8.977221862076156e-05, "3": 1.853939332195963e-08, "1": 0, "2": 0}, "score": 4.999910190699003}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9153470921071124, "4": 0.08461375812508891, "3": 3.895914597460058e-05, "2": 1.8718264229220404e-07, "1": 0}, "score": 4.915307761743763}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6824777453503054, "3": 0.3062696977524247, "2": 0.008538102376752456, "5": 0.0027063159418685874, "1": 8.048281239110118e-06}, "score": 3.6793362396371143}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9580985938219109, "5": 0.03642618845425183, "3": 0.00546857942063573, "2": 6.426650969231069e-06, "1": 0}, "score": 4.030944762281205}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6567681465267252, "5": 0.34271280011885075, "3": 0.0005185425863065868, "2": 4.6742262964478995e-07, "1": 0}, "score": 4.342193337519822}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9128243633535356, "4": 0.08713300801816617, "3": 4.246834852836238e-05, "2": 1.3762145508763365e-07, "1": 0}, "score": 4.912781640444192}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9164703019424038, "4": 0.08351000783465796, "3": 1.9568567069669277e-05, "2": 4.895447756189988e-08, "1": 0}, "score": 4.916450702093619}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7022033250988814, "3": 0.2878913865535495, "2": 0.006713819935783342, "5": 0.003184458564042342, "1": 7.043706745579255e-06}, "score": 3.701844311113943}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8512303461569403, "5": 0.14819953555973406, "3": 0.0005685481794452884, "2": 1.4126516738129754e-06, "1": 0}, "score": 4.147628185321325}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8756043721736665, "5": 0.12239967061028198, "3": 0.001993953355785892, "2": 1.976648152547675e-06, "1": 0}, "score": 4.120401767234577}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8795544821430045, "4": 0.12041423767309108, "3": 3.115655193051785e-05, "2": 6.945151178641775e-08, "1": 0}, "score": 4.8795232343410255}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9616846968432591, "4": 0.03831222282101131, "3": 2.938788900761969e-06, "1": 0, "2": 0}, "score": 4.961681894177381}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7973167111634989, "4": 0.20224527206581772, "3": 0.0004353705719444749, "2": 2.2593802679632683e-06, "1": 1.5377597522138053e-07}, "score": 4.796876546209193}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8488745463173338, "4": 0.15061088329384975, "3": 0.0005134122650297843, "2": 7.599835869634175e-07, "1": 0}, "score": 4.848359951851331}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9788221949464906, "4": 0.02113614861201147, "3": 4.1575687360387664e-05, "2": 4.463721092963966e-08, "1": 0}, "score": 4.978780565335255}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979155594697793, "4": 0.0020836669098317725, "3": 7.327252754943135e-07, "1": 0, "2": 0}, "score": 4.9979148675543446}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9852185285702955, "4": 0.01477368679268201, "3": 7.727949467190973e-06, "2": 1.633795350255495e-08, "1": 0}, "score": 4.985210807697785}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8346325757620072, "5": 0.1630755155298087, "3": 0.00228782658867487, "2": 3.8910519995230496e-06, "1": 6.228133841037375e-08}, "score": 4.1607797406993265}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9631090285417118, "4": 0.036884443580909865, "3": 6.4210172670705435e-06, "2": 1.5481439223689588e-08, "1": 0}, "score": 4.963102664568608}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.975236221370721, "3": 0.014631529850572233, "5": 0.010114957601674817, "2": 1.7184873650544134e-05, "1": 7.394605470928696e-08}, "score": 3.9954488360183738}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.834352728653712, "4": 0.16552109997423844, "3": 0.00012570495800344385, "2": 2.4525336939050034e-07, "1": 0}, "score": 4.834226717687116}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9828172977615718, "4": 0.01717801346134063, "3": 4.628572744110219e-06, "1": 0, "2": 0}, "score": 4.9828127283584225}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8338099335650222, "5": 0.1640056828883607, "3": 0.0021796521045173026, "2": 4.3466070748570864e-06, "1": 0}, "score": 4.161817399842697}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8135498384263901, "5": 0.18552632374896252, "3": 0.0009229323682328334, "2": 8.500488657473126e-07, "1": 0}, "score": 4.184601701511327}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9097094738053345, "5": 0.08594932505047445, "3": 0.004336301860473881, "2": 4.652508599828544e-06, "1": 0}, "score": 4.081603738310573}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9500795357974309, "5": 0.035295051817852335, "3": 0.01433108965367222, "2": 0.00029207965552598516, "1": 1.93613469048184e-06}, "score": 4.020374000702669}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8422274841752262, "5": 0.14734115481529092, "3": 0.01024781875944787, "2": 0.000181565334379431, "1": 1.6584966474439936e-06}, "score": 4.1367252734330675}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6994333582258846, "4": 0.28804559367632104, "2": 0.010987533138029592, "5": 0.0015095132969684007, "1": 2.3565353420825116e-05}, "score": 3.2800300786051357}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5902361015566318, "5": 0.4072949349821943, "3": 0.002465964426332391, "2": 2.493552892583819e-06, "1": 0}, "score": 4.404824188081395}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.878648243001624, "3": 0.10255557830397036, "5": 0.018570832021816048, "2": 0.0002243442175749307, "1": 7.734521736015415e-07}, "score": 3.915564225590143}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8244894769592106, "5": 0.11321827345046628, "3": 0.06173784283641354, "2": 0.000551367776780724, "1": 2.792221618390252e-06}, "score": 4.050369330824545}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9094095647477607, "5": 0.07619325022022737, "3": 0.01436338527156375, "2": 3.273521985132963e-05, "1": 8.79033349243244e-07}, "score": 4.061761768866168}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8464650719372898, "5": 0.15166791772455307, "3": 0.001860332581468514, "2": 6.541434984325037e-06, "1": 9.532211467057322e-08}, "score": 4.149794222448273}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9959764974636468, "4": 0.004022369991271655, "3": 1.1565871516590684e-06, "2": 7.191255952567173e-09, "1": 0}, "score": 4.995975295386361}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9936935337615658, "4": 0.006305065002143999, "3": 1.4205477802474606e-06, "2": 6.261995078334164e-09, "1": 0}, "score": 4.993692075277626}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999480733442354, "4": 5.184733618595061e-05, "3": 3.82107097759735e-08, "1": 0, "2": 0}, "score": 4.99994807624026}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921851251633913, "4": 0.0078085811700634045, "3": 6.222399213146006e-06, "2": 4.930107257742723e-08, "1": 0}, "score": 4.99217882595649}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9519017588509358, "5": 0.03447255082106467, "3": 0.013600958646651074, "2": 2.4585911065693264e-05, "1": 1.297108622622616e-07}, "score": 4.020822031554085}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7484365337250023, "3": 0.22865807809066543, "5": 0.012133654786083067, "2": 0.010763569944999768, "1": 8.097388141105369e-06}, "score": 3.7619241289124865}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8928662940710067, "4": 0.1068663276300108, "3": 0.0002664339999504764, "2": 7.008394542753946e-07, "1": 0}, "score": 4.892598675703844}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9150573299375012, "3": 0.05140264236309708, "5": 0.03263813137713746, "2": 0.0008977629500097436, "1": 4.064560251618221e-06}, "score": 3.9794277680176497}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7400471859644402, "5": 0.2570151105245381, "3": 0.002932460345351075, "2": 5.154744527084145e-06, "1": 5.540788083338596e-08}, "score": 4.254072182854243}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9039373627354615, "5": 0.0900105313947886, "3": 0.006036016527052588, "2": 1.5433671103866492e-05, "1": 3.060191975103449e-07}, "score": 4.083942758818722}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945336581173797, "4": 0.005464317777523733, "3": 1.94914255008113e-06, "2": 1.1900731120722862e-08, "1": 0}, "score": 4.9945317478903455}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9692606990583925, "4": 0.030720573569340347, "3": 1.8576021046782243e-05, "2": 4.656610132057155e-08, "1": 0}, "score": 4.969242131467294}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997839702377902, "4": 0.00021583679814631096, "3": 9.257080738677625e-08, "1": 0, "2": 0}, "score": 4.999783978038552}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951194291798551, "4": 0.004879363002069395, "3": 1.1785248837837153e-06, "2": 6.9297922676636105e-09, "1": 0}, "score": 4.9951182590496135}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7880873066661405, "5": 0.20800108145322177, "3": 0.003889023037759595, "2": 2.211567333778208e-05, "1": 3.8502560437494124e-07}, "score": 4.204066689979214}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8726415439850583, "4": 0.12732744545435914, "3": 3.092211296705023e-05, "2": 1.0601025523649297e-07, "1": 0}, "score": 4.872610394526239}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9557789371127201, "5": 0.040870007414061896, "3": 0.0033474965868872143, "2": 3.4573885783518045e-06, "1": 2.087653575111211e-08}, "score": 4.037515536444959}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6150303886237685, "5": 0.38422338260394856, "3": 0.000743920339074597, "2": 2.059859049657641e-06, "1": 3.3765272616996056e-08}, "score": 4.3834753236248645}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.995801038394945, "4": 0.004198611095210049, "3": 3.3107364297051583e-07, "2": 1.4871519337608655e-09, "1": 0}, "score": 4.995800722220675}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9217293824048107, "4": 0.07822640723559969, "3": 4.404454719341131e-05, "2": 1.293507668297372e-07, "1": 0}, "score": 4.921685112762224}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9982267894987035, "4": 0.0017729022250971632, "3": 2.782939243360947e-07, "1": 0, "2": 0}, "score": 4.998226541133882}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6257362515914471, "4": 0.3740748903633671, "3": 0.00018860550489280064, "2": 1.321902056025509e-07, "1": 0}, "score": 4.625547456990835}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992380680876479, "4": 0.000761842664980773, "3": 5.341287581040446e-08, "1": 0, "2": 0}, "score": 4.999238050481964}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9783937290721127, "4": 0.021603455505078927, "3": 2.8492578531437795e-06, "2": 6.3142932719729225e-09, "1": 0}, "score": 4.9783908279039295}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9251781180064845, "3": 0.06507178069583881, "5": 0.00951101764750461, "2": 0.00023837035031301328, "1": 6.512250861776466e-07}, "score": 3.9439605390971444}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.90482988077166, "4": 0.0951439948200937, "3": 2.5923128382339704e-05, "2": 9.628011784982886e-08, "1": 0}, "score": 4.904803860087217}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.567414841453131, "4": 0.43217228602441177, "3": 0.0004120445843614385, "2": 8.274095837627676e-07, "1": 2.351458429490866e-08}, "score": 4.567001058472723}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997733634559426, "4": 0.00022645824020392751, "3": 6.181350307440639e-08, "1": 0, "2": 0}, "score": 4.999773418106394}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998120929467422, "4": 0.0001878394404864352, "3": 3.2333920095250785e-08, "1": 0, "2": 0}, "score": 4.999812095885044}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9661619748475674, "5": 0.021364075126736645, "3": 0.012464097093115238, "2": 9.737929888636661e-06, "1": 3.602736674230702e-08}, "score": 4.008880394793076}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9950242840907619, "4": 0.004975616482341487, "3": 1.0797166557829623e-07, "1": 0, "2": 0}, "score": 4.995024167616846}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6361318536941974, "4": 0.3636161502630844, "3": 0.0002518628159079039, "2": 1.249506472008742e-07, "1": 0}, "score": 4.635879746239639}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971204662333419, "4": 0.00287945280831174, "3": 8.347271708318359e-08, "1": 0, "2": 0}, "score": 4.997120380253495}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9474740426697787, "4": 0.052519628661149655, "3": 6.261868092735406e-06, "1": 0, "2": 0}, "score": 4.947467844093466}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6949306656837361, "4": 0.3049455020937595, "3": 0.00012343448851585747, "2": 3.5846098904375003e-07, "1": 2.947386200763351e-08}, "score": 4.694806432660161}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9958646437322315, "4": 0.004134152207267011, "3": 1.2056966804992363e-06, "2": 1.1781327194515205e-08, "1": 0}, "score": 4.995863401110894}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8235935379185061, "4": 0.17635774586772532, "3": 4.8530650041726635e-05, "2": 1.225435941078832e-07, "1": 0}, "score": 4.8235448140811785}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999155329675407, "4": 8.42983724319418e-05, "3": 4.471351643225648e-08, "1": 0, "2": 0}, "score": 4.999915612190075}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989470242684183, "4": 0.0010528052612687301, "3": 1.0611557570289986e-07, "1": 0, "2": 0}, "score": 4.998946982439813}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7537167083068209, "4": 0.24599691100963866, "3": 0.00028575521649654704, "2": 5.74984932983118e-07, "1": 0}, "score": 4.753429841155187}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8068468707148132, "5": 0.19169555815744552, "3": 0.0014547270361196468, "2": 2.7629903627363427e-06, "1": 2.6893452001195196e-08}, "score": 4.190235234772479}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8211677059902427, "4": 0.1786826592245697, "3": 0.0001492272867279248, "2": 3.357422783568772e-07, "1": 1.620879241941517e-08}, "score": 4.821017804197976}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5429319441283564, "5": 0.45603012867257614, "3": 0.0010352723984336336, "2": 2.4723609837622355e-06, "1": 0}, "score": 4.454989994560391}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9988549609580597, "4": 0.0011446538523953345, "3": 3.435528086939683e-07, "1": 0, "2": 0}, "score": 4.998854658994299}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9996348072491118, "4": 0.0003650240193896324, "3": 9.344629039317077e-08, "1": 0, "2": 0}, "score": 4.999634789060535}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998965813680755, "4": 0.00010338289862937785, "3": 8.739918257600444e-09, "1": 0, "2": 0}, "score": 4.999896599618744}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991203676535549, "4": 0.0008794634080965994, "3": 7.177195758965003e-08, "1": 0, "2": 0}, "score": 4.99912039296252}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.993663529240838, "4": 0.0063359995214420164, "3": 4.85965112792554e-07, "1": 0, "2": 0}, "score": 4.9936630286416595}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9960014431029941, "4": 0.003998026158615485, "3": 5.172823396468445e-07, "1": 0, "2": 0}, "score": 4.996000939222894}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8498921414169076, "3": 0.14756916468337952, "5": 0.001916461043975761, "2": 0.0006213713920272563, "1": 7.560328570537509e-07}, "score": 3.8531022699904174}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6438935767676655, "4": 0.34071473706391264, "2": 0.015095946725040246, "5": 0.0002899617616664932, "1": 5.5940277641230235e-06}, "score": 3.326187585712316}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5605295371496365, "4": 0.43882488969684236, "3": 0.0006441551143952831, "2": 1.4010242243532028e-06, "1": 1.5225685495942177e-08}, "score": 4.559882535311487}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6017588772734116, "4": 0.39726220115118954, "3": 0.0009697696392308234, "2": 8.728308186176532e-06, "1": 1.6630024125948923e-07}, "score": 4.600771306712207}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5887197235158375, "3": 0.37069231503325395, "2": 0.038432235707428763, "5": 0.0021243487376059133, "1": 3.08340487401479e-05}, "score": 3.5544748182421984}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6337108633921077, "4": 0.3661053300359616, "3": 0.0001837124122463415, "2": 7.015280818862164e-08, "1": 0}, "score": 4.633527025883249}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9352082193445843, "5": 0.05807002901167348, "3": 0.00671600631147708, "2": 5.715327254369831e-06, "1": 2.175663648948158e-08}, "score": 4.051342527199271}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6150976274210584, "5": 0.3843035015313294, "3": 0.0005987338395000335, "2": 1.4298101181694971e-07, "1": 0}, "score": 4.383704479514718}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999380608083109, "4": 6.189822834049763e-05, "3": 5.345990480010371e-09, "1": 0, "2": 0}, "score": 4.999938091077474}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9534182618000546, "5": 0.04500020201498523, "3": 0.001579890086293639, "2": 1.621105879414332e-06, "1": 1.8865801468820548e-08}, "score": 4.043417013385544}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9562510010426045, "5": 0.03389036578905211, "3": 0.009833355992353422, "2": 2.5068060805060793e-05, "1": 7.539257813501363e-08}, "score": 4.0240066507075865}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5992493442216941, "4": 0.40045737003469356, "3": 0.0002929279159100785, "2": 3.7515783732351017e-07, "1": 0}, "score": 4.598955655610127}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7928410966192615, "4": 0.20703690843339645, "3": 0.00012173828772658464, "2": 2.348342243574541e-07, "1": 0}, "score": 4.792718905964486}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9820159621741024, "4": 0.01797671445412315, "3": 7.21102105636456e-06, "2": 7.13899309967468e-08, "1": 0}, "score": 4.98200864859703}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6344594198374026, "4": 0.3652696978614544, "3": 0.0002686734113931129, "2": 1.939054645093583e-06, "1": 8.684473220868254e-08}, "score": 4.634186723832587}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"5": 0.586263225492869, "4": 0.4133729776422415, "3": 0.00036331377613838, "2": 3.4201884467942644e-07, "1": 0}, "score": 4.585899310331802}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8777704201552391, "4": 0.12220520977134659, "3": 2.429733219156703e-05, "2": 1.672358229742922e-08, "1": 0}, "score": 4.877746138545151}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7354842155602203, "4": 0.26439959573392685, "3": 0.00011613282253987864, "2": 6.16421467425023e-08, "1": 0}, "score": 4.735367955218525}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967001213070951, "4": 0.0032992318840901437, "3": 6.374566896663367e-07, "1": 0, "2": 0}, "score": 4.996699493171665}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997377449448706, "4": 0.0002620167827387292, "3": 1.2594796392737186e-07, "1": 0, "2": 0}, "score": 4.999737731291874}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9748070295334083, "3": 0.018069153880820636, "5": 0.0071104410837184925, "2": 1.3121282863476718e-05, "1": 9.33907063882681e-08}, "score": 3.989014762698313}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9984312557676207, "4": 0.001568298978760847, "3": 3.827510726234015e-07, "1": 0, "2": 0}, "score": 4.998430935421024}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9600342289496497, "5": 0.03725425919081304, "3": 0.0027081622788702954, "2": 3.298894980374739e-06, "1": 3.172445507533058e-08}, "score": 4.034539404603527}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.884605390368905, "4": 0.1153757598806109, "3": 1.8784603245046724e-05, "2": 4.373631819602744e-08, "1": 0}, "score": 4.8845865372328365}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5924694905744474, "5": 0.4062948708964847, "3": 0.0012302519416044566, "2": 5.245505202357664e-06, "1": 7.325150816338225e-08}, "score": 4.405053935665066}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8419362501643685, "5": 0.1566996285619196, "3": 0.0013590029134451676, "2": 4.984582047956039e-06, "1": 6.852515039592685e-08}, "score": 4.1553304610447155}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998317543748829, "4": 0.00016817171289242185, "3": 3.51437163986562e-08, "1": 0, "2": 0}, "score": 4.999831757993153}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5749183202581758, "4": 0.42479881440796696, "3": 0.00028193810413509835, "2": 8.914272562499261e-07, "1": 0}, "score": 4.574634619872864}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998013666902087, "4": 0.00019844749532580647, "3": 5.5465645935605897e-08, "1": 0, "2": 0}, "score": 4.9998014415475}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998495092248729, "4": 0.00015039340457047718, "3": 1.4221058186134794e-08, "1": 0, "2": 0}, "score": 4.999849578140806}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8946229628726441, "5": 0.10170711680083869, "3": 0.0036637007812902462, "2": 5.895489446649891e-06, "1": 9.396748676380767e-08}, "score": 4.098031365694065}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9513053413454353, "4": 0.04868038997036361, "3": 1.4132930318521343e-05, "2": 4.571908551861113e-08, "1": 0}, "score": 4.9512912026262565}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7625614527329049, "5": 0.23656194061323307, "3": 0.0008758985361929659, "2": 6.290752204720676e-07, "1": 0}, "score": 4.235684802555704}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5055298458647234, "4": 0.4940491365699072, "3": 0.00041960867802285517, "2": 1.37194516041833e-06, "1": 0}, "score": 4.505107511956155}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5313584172688596, "4": 0.4681848604946154, "3": 0.00045480295443036994, "2": 1.7128601197714694e-06, "1": 6.62547948238088e-08}, "score": 4.5309000642445705}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9651290683512906, "4": 0.03484992827095363, "3": 2.0762460198841835e-05, "2": 1.3460422916287582e-07, "1": 2.0321670661953332e-08}, "score": 4.9651080587088625}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9956843781751186, "4": 0.004309001811281792, "3": 6.429601479116159e-06, "2": 1.897707637082287e-07, "1": 5.8303891281152575e-08}, "score": 4.99567733670716}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991696318066366, "4": 0.0008293228778059092, "3": 9.814831411449328e-07, "2": 1.3914560876921416e-08, "1": 0}, "score": 4.999168672370732}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999269246830243, "4": 0.0007304987777090787, "3": 2.1712274460083814e-07, "1": 0, "2": 0}, "score": 4.9992690669495605}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7859189334314179, "4": 0.21389207790968548, "3": 0.0001885302663074444, "2": 3.429932737606533e-07, "1": 0}, "score": 4.785729807851245}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7548279473555266, "5": 0.15350124519012534, "3": 0.09018452768976357, "2": 0.0014714243525573573, "1": 1.4833758425083795e-05}, "score": 4.060329368826321}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8847288191231589, "4": 0.11494812952271867, "3": 0.00032056227330302023, "2": 2.4257592252442537e-06, "1": 5.812249911168865e-08}, "score": 4.884403235562005}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7273307885855441, "5": 0.2707070335167346, "3": 0.001956089405657998, "2": 5.9779730638056e-06, "1": 8.096936205999519e-08}, "score": 4.268738753197995}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999950338100193, "4": 4.9512569070789673e-05, "3": 1.9475160575729444e-08, "1": 0, "2": 0}, "score": 4.9999504484741735}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8452004337907583, "4": 0.15473280318842828, "3": 6.652830910901079e-05, "2": 2.0182254817724842e-07, "1": 0}, "score": 4.84513352963228}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7440834771296249, "4": 0.25577285846042763, "3": 0.00014350323205311718, "2": 2.2775895093453296e-07, "1": 0}, "score": 4.743939468847393}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9928094883260195, "4": 0.007189950441292416, "3": 5.488701194606171e-07, "1": 0, "2": 0}, "score": 4.992808951729569}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.511450230193018, "5": 0.4881036979030659, "3": 0.00044574625625999316, "2": 2.8365333380734945e-07, "1": 0}, "score": 4.487657404818981}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7194555022111163, "4": 0.28046674982331415, "3": 7.761234953071694e-05, "2": 5.963429553088355e-08, "1": 0}, "score": 4.719377825252576}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999910407653634, "4": 8.943995962299064e-05, "3": 3.224180288889712e-08, "1": 0, "2": 0}, "score": 4.999910495546018}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.559185454313752, "5": 0.4402998970668669, "3": 0.0005143065857479903, "2": 2.8233444317725084e-07, "1": 0}, "score": 4.439785052067043}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9271620708379642, "5": 0.06862799754730105, "3": 0.004194943112254875, "2": 1.4528344842230912e-05, "1": 2.592118904165003e-07}, "score": 4.064403233051246}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6012952142342312, "4": 0.3983364814874869, "3": 0.0003677741614106981, "2": 5.071566026919233e-07, "1": 0}, "score": 4.600926439557048}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979959306340282, "4": 0.0020034617893881375, "3": 5.409716296759649e-07, "1": 0, "2": 0}, "score": 4.9979954561338396}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9727651527590407, "4": 0.027227883556887038, "3": 6.814928393915718e-06, "2": 1.3708976495838843e-08, "1": 0}, "score": 4.972758441780512}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.967625713582344, "5": 0.02873867794244902, "3": 0.0036342173524353955, "2": 1.3367623825297632e-06, "1": 0}, "score": 4.025101788429792}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9983889599205464, "4": 0.001610703884799893, "3": 3.244413684078361e-07, "1": 0, "2": 0}, "score": 4.998388647213525}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5816921925130514, "4": 0.41803843538615687, "3": 0.0002690670373312745, "2": 1.9528906332339057e-07, "1": 0}, "score": 4.581422798722931}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9371161640389509, "4": 0.06287478311697452, "3": 8.938354912261326e-06, "2": 2.2194884556568072e-08, "1": 0}, "score": 4.937107267783909}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5638883545527498, "5": 0.43573418020128335, "3": 0.0003767924698259909, "2": 6.202091978078982e-07, "1": 0}, "score": 4.435356170198404}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9982531621004467, "4": 0.0017466772677730477, "3": 9.178215024516683e-08, "1": 0, "2": 0}, "score": 4.998253139047657}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.818876188950121, "4": 0.1808023198640333, "3": 0.00031747134362629696, "2": 3.5559048438248424e-06, "1": 1.3987313552264232e-07}, "score": 4.818551451440656}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8671620593529362, "5": 0.12361931202583419, "3": 0.009194052236761334, "2": 2.43529637807636e-05, "1": 9.041261796768602e-08}, "score": 4.114376297836628}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991107317036185, "4": 0.0008891941098468761, "3": 7.08527540503944e-08, "1": 0, "2": 0}, "score": 4.99911066418168}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9581060344444824, "3": 0.025314738587527825, "5": 0.016097842857090955, "2": 0.00047806086545078616, "1": 2.9850860024312353e-06}, "score": 3.989818023837523}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9102939860964203, "3": 0.08614837315946698, "5": 0.003220166218841164, "2": 0.0003366320714992686, "1": 5.996576067696113e-07}, "score": 3.9163967096449968}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995688277314909, "4": 0.00043105813196786595, "3": 9.878204297268198e-08, "1": 0, "2": 0}, "score": 4.999568744297324}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.996315396073699, "4": 0.003682657281561921, "3": 1.8895364944518306e-06, "2": 2.598799854280424e-08, "1": 0}, "score": 4.996313485566728}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9669101249392404, "4": 0.03308357643330399, "3": 6.090228234593294e-06, "1": 0, "2": 0}, "score": 4.966904236213096}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6805678198933681, "4": 0.31922464747089485, "3": 0.00020535199551099202, "2": 1.8724552881456336e-06, "1": 9.661363080892064e-08}, "score": 4.680358577090742}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9497652216839314, "5": 0.041295167316093936, "3": 0.008930347241708048, "2": 9.212622531199598e-06, "1": 4.445888533109794e-08}, "score": 4.032346261668639}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.990373187315059, "4": 0.009625893229974484, "3": 8.976289949032516e-07, "1": 0, "2": 0}, "score": 4.990372311301902}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8175669365424885, "4": 0.18232506748065375, "3": 0.00010790115299321025, "2": 9.545651819519165e-08, "1": 0}, "score": 4.81745884395929}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8612494975936354, "4": 0.13866325653320458, "3": 8.709796833831185e-05, "2": 9.56661797106915e-08, "1": 0}, "score": 4.861162253278884}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8925228798238107, "4": 0.10746343809600825, "3": 1.3598881653006987e-05, "2": 1.4373652410699638e-08, "1": 0}, "score": 4.892509313621696}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8658133455217651, "5": 0.11627122157410649, "3": 0.017803788629113856, "2": 0.00010964321102213479, "1": 1.4822564542625834e-06}, "score": 4.098243750723184}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8499941090935221, "4": 0.14916060017205093, "3": 0.0008415257034491125, "2": 3.6717726559145933e-06, "1": 1.4471059290652148e-07}, "score": 4.849144762022557}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6695875454265102, "4": 0.3191060456294816, "3": 0.011150763590142939, "2": 0.00015097534690627099, "1": 4.027841231887946e-06}, "score": 4.6581231702430035}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9707509342214768, "4": 0.029100166010290016, "3": 0.00014669939454325942, "2": 1.990660628895119e-06, "1": 1.5507080777264348e-07}, "score": 4.970599841329015}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7211807857952823, "4": 0.27519198434513226, "3": 0.003592047158033083, "2": 3.395776538738094e-05, "1": 7.684410383062019e-07}, "score": 4.717518845327215}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8600097264267434, "4": 0.1399305011482305, "3": 5.961186062001807e-05, "2": 1.38533868958187e-07, "1": 0}, "score": 4.859949856443542}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.923373137677529, "5": 0.07064446619175042, "3": 0.005958703232607844, "2": 2.348647111090123e-05, "1": 7.135988216152087e-08}, "score": 4.064638584667822}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8175822415387949, "5": 0.18196298349162857, "3": 0.0004542590172645201, "2": 4.482252234244947e-07, "1": 1.5698275050863205e-08}, "score": 4.181507790372727}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971129962336384, "4": 0.0028868232583662314, "3": 1.4097123140138762e-07, "1": 0, "2": 0}, "score": 4.997112894685024}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9960771389017481, "4": 0.003922333192790072, "3": 5.063564343154573e-07, "2": 6.033895589831728e-09, "1": 0}, "score": 4.996076635931782}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8316845139795782, "5": 0.1666045731077131, "3": 0.0017091577049923898, "2": 1.6133012701101495e-06, "1": 0}, "score": 4.164892212199448}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999637428784835, "4": 0.00036239155030597873, "3": 9.538953123459271e-08, "1": 0, "2": 0}, "score": 4.999637417640074}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993788968644571, "4": 0.0006208127818419233, "3": 2.1676392041067696e-07, "1": 0, "2": 0}, "score": 4.999378753644599}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979315783384918, "4": 0.002067891065459988, "3": 5.280282768679508e-07, "1": 0, "2": 0}, "score": 4.997931052872674}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9810125759284631, "4": 0.01898400872976925, "3": 3.4602144190190445e-06, "2": 9.217407694760309e-09, "1": 0}, "score": 4.981009044216392}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8982413885082075, "4": 0.1016926245692906, "3": 6.571022584923922e-05, "2": 2.200251453676032e-07, "1": 0}, "score": 4.898175289133015}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9577952446053261, "4": 0.042168473946915266, "3": 3.616112178884144e-05, "2": 6.719835962886441e-08, "1": 0}, "score": 4.957758999970265}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7003903195376354, "5": 0.2981229779262053, "3": 0.0014854166109186501, "2": 1.2203315180818748e-06, "1": 3.19084491049909e-08}, "score": 4.296635034919136}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987365162685456, "4": 0.0012624234907970076, "3": 9.866948643220472e-07, "1": 0, "2": 0}, "score": 4.998735603026483}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9946855474360486, "4": 0.005312061443239469, "3": 2.3787985706127484e-06, "2": 1.2102933206026189e-08, "1": 0}, "score": 4.994683144649655}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8464154366807913, "5": 0.1504727762289128, "3": 0.0031044624580031242, "2": 7.151209891351942e-06, "1": 1.1998297250790256e-07}, "score": 4.147353659276705}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9983372716669641, "4": 0.0016623836048591913, "3": 2.8849646618463986e-07, "1": 0, "2": 0}, "score": 4.998337039308698}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9912652059244192, "4": 0.008732537386386333, "3": 2.1747300849458516e-06, "1": 0, "2": 0}, "score": 4.991263112437376}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9780195797044704, "4": 0.021976266574653874, "3": 4.147826897604345e-06, "2": 1.8671640780357532e-08, "1": 0}, "score": 4.97801538203754}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9232069879380149, "4": 0.07677835611245866, "3": 1.454720033063229e-05, "2": 5.793819488454531e-08, "1": 0}, "score": 4.923192371769622}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6744028812415598, "5": 0.3245741381687729, "3": 0.0010217473797458046, "2": 1.077500016128568e-06, "1": 3.842394515300249e-08}, "score": 4.323550158465051}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8099793139298272, "4": 0.18994114841249451, "3": 7.940200008825874e-05, "2": 1.1257299289106194e-07, "1": 0}, "score": 4.809899705479961}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6492583419027922, "5": 0.35018713358382414, "3": 0.000553995496672516, "2": 4.263624631423327e-07, "1": 2.5847033520618263e-08}, "score": 4.349632234675402}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960345589086921, "4": 0.003964880353550207, "3": 5.205837806399867e-07, "2": 1.718116850967977e-09, "1": 0}, "score": 4.996034073172104}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9551600671167332, "4": 0.04483057924386913, "3": 9.24647648083113e-06, "2": 4.254102212827496e-08, "1": 0}, "score": 4.955150797281862}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.927803491006685, "3": 0.07019150406426673, "5": 0.001878466737601535, "2": 0.00012645778764386545, "1": 8.350870157834832e-08}, "score": 3.9314337967848334}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9954897667883319, "4": 0.004509506747833757, "3": 6.837058880679832e-07, "2": 1.7089443435836345e-09, "1": 0}, "score": 4.995489120528391}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7274156221223884, "4": 0.2724818425344526, "3": 0.00010241524289913723, "2": 1.0010662189660506e-07, "1": 0}, "score": 4.7273130212078796}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967880048291253, "4": 0.0032117670835124772, "3": 2.7662998996586963e-07, "1": 0, "2": 0}, "score": 4.996787679812442}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.988685535502964, "4": 0.011312194226760844, "3": 2.1958265982065947e-06, "2": 1.4641337109027006e-08, "1": 0}, "score": 4.98868336951927}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6494247551539382, "4": 0.35030229404468877, "3": 0.0002724345925531595, "2": 4.605824282424434e-07, "1": 2.303638302971291e-08}, "score": 4.649151351443227}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.883100105536974, "5": 0.11376463159688129, "3": 0.0031292988785036396, "2": 5.841347800468962e-06, "1": 1.1868665119441328e-07}, "score": 4.1106232944001375}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6345073740925224, "5": 0.36453376429966083, "3": 0.0009565559273138077, "2": 2.160342033416745e-06, "1": 9.221380396183713e-08}, "score": 4.363572630361543}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992909189168955, "4": 0.0007087818965389022, "3": 2.8000902560306886e-07, "1": 0, "2": 0}, "score": 4.999290658071807}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9923425105086414, "4": 0.007656104312420462, "3": 1.3528027588517815e-06, "1": 0, "2": 0}, "score": 4.992341189834098}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5753279804608562, "5": 0.42441528811499035, "3": 0.00025608452300240984, "2": 5.169151995358578e-07, "1": 0}, "score": 4.4241582248962}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999512916842885, "4": 4.859290623277195e-05, "3": 1.717100026801858e-09, "1": 0, "2": 0}, "score": 4.999951403654043}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6801533578426587, "4": 0.31965943996947793, "3": 0.000187006721108293, "2": 1.3534929900874895e-07, "1": 0}, "score": 4.679966121300786}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999810915907662, "4": 1.8826238429773462e-05, "3": 2.0684071885432617e-09, "1": 0, "2": 0}, "score": 4.999981169623248}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.526175800816282, "5": 0.47368402191961595, "3": 0.00013979395072828848, "2": 2.372704991565698e-07, "1": 0}, "score": 4.473543822585591}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8959911439862236, "5": 0.09688154812931896, "3": 0.007114685150004399, "2": 1.2418043773795046e-05, "1": 0}, "score": 4.0897420452611275}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999963211539712, "4": 3.6714785844258164e-05, "3": 3.3795945407871927e-08, "1": 0, "2": 0}, "score": 4.999963217620798}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5703225505752741, "5": 0.42858328318703814, "3": 0.0010905276688687948, "2": 3.513840356279057e-06, "1": 4.957297552428534e-08}, "score": 4.42748561124642}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995010654092793, "4": 0.0004987448079199256, "3": 9.823414237371343e-08, "1": 0, "2": 0}, "score": 4.999501058678118}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994228273682421, "4": 0.0005769320861673105, "3": 1.3645758543796158e-07, "1": 0, "2": 0}, "score": 4.999422794938582}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6046743864802623, "4": 0.39511461168642914, "3": 0.0002107295500403336, "2": 2.022300350693048e-07, "1": 1.9974986922253414e-08}, "score": 4.6044632228156495}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5133289044369593, "4": 0.4861935905163233, "3": 0.00047669532633860145, "2": 7.338068427354183e-07, "1": 0}, "score": 4.512850780429251}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7114351151920068, "5": 0.28815279538536903, "3": 0.00041142681623260635, "2": 5.387689619246395e-07, "1": 1.4602369892510278e-08}, "score": 4.287740278655431}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999558212119114, "4": 4.405172703974544e-05, "3": 2.7875156300194005e-08, "1": 0, "2": 0}, "score": 4.999955892518273}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999108230712783, "4": 0.0008915592159859125, "3": 1.2003157545320042e-07, "1": 0, "2": 0}, "score": 4.999108200640565}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9722694023623667, "3": 0.017276086792832518, "5": 0.010432090485451493, "2": 2.218795464269965e-05, "1": 8.982019484555332e-08}, "score": 3.9931113573405352}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.946386621138684, "5": 0.0455887866272091, "3": 0.008017252474708678, "2": 7.190966301930569e-06, "1": 4.90808941035935e-08}, "score": 4.037557008722107}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5343729048752954, "4": 0.4650759748345374, "3": 0.0005498120859646121, "2": 1.12904377533617e-06, "1": 0}, "score": 4.533820930341365}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979939120895003, "4": 0.0020054997448084974, "3": 5.6299167261977e-07, "2": 2.787292896890449e-09, "1": 0}, "score": 4.997993365865046}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5988958314978563, "4": 0.4009079857404057, "3": 0.00019577686326361355, "2": 3.2568245327580954e-07, "1": 0}, "score": 4.598699451294974}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9746366881165154, "4": 0.025349075982595164, "3": 1.399008071255635e-05, "2": 1.9510694359937225e-07, "1": 0}, "score": 4.974622357248167}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8034529755780655, "4": 0.19634369686524886, "3": 0.00020244546830588197, "2": 7.414322858777173e-07, "1": 4.018439904913988e-08}, "score": 4.803249007395779}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9967332830684905, "4": 0.003265054905530122, "3": 1.6286404026688828e-06, "2": 1.0456866426585485e-08, "1": 0}, "score": 4.9967316563681266}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9980685896780097, "4": 0.0019299812328973578, "3": 1.3576300345528601e-06, "2": 1.8315649108209194e-08, "1": 0}, "score": 4.998067248457374}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997848044778788, "4": 0.00021502441030049404, "3": 9.741165229836429e-08, "1": 0, "2": 0}, "score": 4.999784780750533}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9642462219734979, "3": 0.02052668565700102, "5": 0.01520861857966961, "2": 1.8297611971363756e-05, "1": 7.698078436020664e-08}, "score": 3.9946451062251827}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6558090924490795, "4": 0.34399563866105354, "3": 0.00019479204584643554, "2": 4.131149307546151e-07, "1": 2.369281498402989e-08}, "score": 4.655613429343246}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6421405525808676, "5": 0.35702281203009645, "3": 0.0008349322284001465, "2": 1.6873775159073955e-06, "1": 2.1408517073681138e-08}, "score": 4.356184438817434}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995245187370612, "4": 0.0004752992273264788, "3": 1.0520626344127291e-07, "1": 0, "2": 0}, "score": 4.999524490323614}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9240149295031886, "4": 0.07593882477520762, "3": 4.6056760418045786e-05, "2": 1.5700738413454458e-07, "1": 0}, "score": 4.923968588252311}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6052121023465203, "4": 0.3937551931408991, "3": 0.0010278685394900335, "2": 4.421113369687831e-06, "1": 1.1721792826008659e-07}, "score": 4.6041752197543016}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.99646215238249, "4": 0.003537134651762849, "3": 7.563580210875409e-07, "2": 5.269517682124411e-09, "1": 0}, "score": 4.996461336995839}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5754350589613654, "4": 0.42300229686910434, "3": 0.0015596787631235417, "2": 2.80282141473516e-06, "1": 7.365078762009334e-08}, "score": 4.573869604639685}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977632735090398, "4": 0.0022362330563140227, "3": 4.96563731583475e-07, "1": 0, "2": 0}, "score": 4.997762773823223}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9991693935946331, "4": 0.000830313182525576, "3": 2.719742348372905e-07, "1": 0, "2": 0}, "score": 4.9991691428513505}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9874537645616959, "4": 0.01254563227344215, "3": 5.597990258733071e-07, "1": 0, "2": 0}, "score": 4.987453247584405}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9993508009909248, "4": 0.0006488480487689082, "3": 2.5059969789798377e-07, "1": 0, "2": 0}, "score": 4.999350650686668}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9964775357842957, "4": 0.0035205044147276748, "3": 1.8981933359060861e-06, "2": 2.243301677798889e-08, "1": 0}, "score": 4.996475631761483}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999279291732268, "4": 7.194490069790267e-05, "3": 6.397170843623701e-09, "1": 0, "2": 0}, "score": 4.99992804229636}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9701424641610179, "4": 0.029840313430459935, "3": 1.6734560265219397e-05, "2": 2.1756438657414934e-07, "1": 0}, "score": 4.970125556681271}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5431948139518482, "5": 0.4551349093108111, "3": 0.0016637137111049406, "2": 6.4597496163491145e-06, "1": 9.09524494967732e-08}, "score": 4.453458008831619}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9158826443844295, "4": 0.08409498038927878, "3": 2.2266772791852086e-05, "2": 1.1091163874393034e-07, "1": 0}, "score": 4.915860153537049}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7653563474140085, "5": 0.23415581714326644, "3": 0.0004870055688192197, "2": 7.945968164938509e-07, "1": 2.3776693518255818e-08}, "score": 4.233667153737999}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996766260266379, "4": 0.0003232718331432535, "3": 2.5035876019129683e-08, "1": 0, "2": 0}, "score": 4.999676678070175}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997131993651673, "4": 0.0002866713844891396, "3": 6.532931326077442e-08, "1": 0, "2": 0}, "score": 4.999713197938552}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7125259260947051, "4": 0.2873247700617427, "3": 0.0001490249226349259, "2": 2.7489682266236755e-07, "1": 1.6038977234117953e-08}, "score": 4.712376294702377}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9993572301650938, "4": 0.0006411291110700656, "3": 1.3370417950653045e-06, "1": 9.744146482505174e-08, "2": 0}, "score": 4.999355806906622}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9252459823103333, "4": 0.07469436684960891, "3": 5.933228292548909e-05, "2": 2.9035311986477875e-07, "1": 2.363942424082878e-08}, "score": 4.925186002625988}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991345294958276, "4": 0.0008653755356379412, "3": 9.670158922796766e-08, "1": 0, "2": 0}, "score": 4.999134431062683}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9920590978759786, "4": 0.007936515134538807, "3": 4.291814302893758e-06, "2": 6.522917491997634e-08, "1": 0}, "score": 4.9920547053114}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9071671563335862, "5": 0.062081241805313284, "3": 0.03050468501853688, "2": 0.00024420463893751025, "1": 2.4645138278578057e-06}, "score": 4.031080761665804}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9944097455512312, "4": 0.005589415270830833, "3": 8.3956410702758e-07, "2": 1.6825371069534456e-09, "1": 0}, "score": 4.994408900564911}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9977828580981066, "4": 0.0022166955122988564, "3": 4.893729300466601e-07, "2": 4.259862304818864e-09, "1": 0}, "score": 4.997782313067026}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957905178125495, "4": 0.004208972596105508, "3": 4.629262883324978e-07, "2": 2.647786047256051e-09, "1": 0}, "score": 4.9957900934226505}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7163872401667881, "5": 0.28269842092209907, "3": 0.0009129644643297513, "2": 1.3110686368191973e-06, "1": 0}, "score": 4.28178285217937}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8358671750830835, "5": 0.15489173344912618, "3": 0.009179057944870929, "2": 6.156820335457793e-05, "1": 4.419310334330599e-07}, "score": 4.14558821670954}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6951497006452458, "5": 0.3039225134600262, "3": 0.0009245462327542182, "2": 3.0296847098873563e-06, "1": 8.954092980014926e-08}, "score": 4.30299167572627}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7321322148142145, "5": 0.2664210038881223, "3": 0.0014449169978525888, "2": 1.5881130619059375e-06, "1": 3.636220230597968e-08}, "score": 4.264972865124537}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.962364761716314, "4": 0.0376289040187593, "3": 6.286003894737018e-06, "2": 6.292968109684169e-09, "1": 0}, "score": 4.962358503514806}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9256658153716424, "4": 0.07431562895884129, "3": 1.8399574842539744e-05, "2": 1.0693870682793653e-07, "1": 1.966298308528497e-08}, "score": 4.925647170230533}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"4": 0.935979579047022, "3": 0.047094879470267186, "5": 0.016853288129579546, "2": 7.18240629124431e-05, "1": 2.0791115248805865e-07}, "score": 3.9696141300732353}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9994484306703203, "4": 0.0005513693757495953, "3": 8.948498420384421e-08, "1": 0, "2": 0}, "score": 4.999448451593354}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7211628141940274, "5": 0.27783793580825705, "3": 0.0009976556313168975, "2": 1.5143746144032547e-06, "1": 2.868099868983363e-08}, "score": 4.276837179589449}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.997998663250427, "4": 0.0020009890413144695, "3": 3.1409071232652545e-07, "1": 0, "2": 0}, "score": 4.997998382709971}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9721073871667542, "4": 0.027884600386849596, "3": 7.890745033483853e-06, "2": 2.8034778731012877e-08, "1": 0}, "score": 4.972099531405406}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9537319584476279, "3": 0.03656415098003552, "5": 0.009621096880138324, "2": 8.250068183426776e-05, "1": 2.600908093966966e-07}, "score": 3.9728911633715946}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945693828058115, "4": 0.005429573463300579, "3": 1.0183845099515582e-06, "1": 0, "2": 0}, "score": 4.994568389630008}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9861077366197534, "4": 0.013887862802016497, "3": 4.276832040031339e-06, "2": 1.8780438765388465e-08, "1": 0}, "score": 4.986103525733934}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999446524524091, "4": 0.0005532846229333945, "3": 9.285218656410923e-08, "1": 0, "2": 0}, "score": 4.999446529618452}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9958589678178694, "4": 0.004137607734781788, "3": 3.3563482680393236e-06, "2": 5.8191473289237535e-08, "1": 0}, "score": 4.9958555049532}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5543585219571023, "5": 0.44476381078542476, "3": 0.0008768522954638764, "2": 6.780383413101496e-07, "1": 0}, "score": 4.443885663191731}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997193962066108, "4": 0.00028054792275020445, "3": 1.8502370091756334e-08, "1": 0, "2": 0}, "score": 4.9997194150620246}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9213272827385561, "4": 0.07860859770259017, "3": 6.391164342217581e-05, "2": 9.720049819793448e-08, "1": 0}, "score": 4.92126327869174}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999572515937392, "4": 4.2628607180742234e-05, "3": 2.0804573387685888e-08, "1": 0, "2": 0}, "score": 4.999957329779449}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9963042760603569, "4": 0.0036949066085106477, "3": 8.469332101568023e-07, "1": 0, "2": 0}, "score": 4.996303399634496}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7311475813044153, "4": 0.2686798652794414, "3": 0.0001722614805127175, "2": 2.713007100694072e-07, "1": 1.7803549311559494e-08}, "score": 4.730974725881495}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7815206390002811, "4": 0.21840280320631664, "3": 7.641175594526568e-05, "2": 1.0081527047252803e-07, "1": 0}, "score": 4.781444060952404}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9362355052308035, "5": 0.06234172713136593, "3": 0.0014214212892795306, "2": 1.269966545457733e-06, "1": 0}, "score": 4.060917770562017}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998779876841082, "4": 0.00012195041869193968, "3": 3.624512309524491e-08, "1": 0, "2": 0}, "score": 4.999877977087932}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9435334072596524, "4": 0.05645494458095678, "3": 1.1489890456052663e-05, "2": 4.2014753774596675e-08, "1": 0}, "score": 4.94352194302806}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7357738842074502, "5": 0.2620477080510077, "3": 0.0021744728752965277, "2": 3.6961678176769368e-06, "1": 8.865734091630817e-08}, "score": 4.259865615858573}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9914118774354089, "4": 0.008586479190988991, "3": 1.6007392566784606e-06, "2": 7.447242554362723e-09, "1": 0}, "score": 4.991410296686523}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8423869918964164, "5": 0.15676976733808173, "3": 0.0008427648357752584, "2": 4.5711515385152863e-07, "1": 0}, "score": 4.155926091205682}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996051515131895, "4": 0.0003948277358340886, "3": 1.585498301860806e-08, "1": 0, "2": 0}, "score": 4.9996051405522675}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9963401267221257, "4": 0.0036592919740345816, "3": 5.395993053263193e-07, "1": 0, "2": 0}, "score": 4.996339628674701}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"5": 0.998916808176246, "4": 0.0010827580966935155, "3": 3.602271616185178e-07, "1": 0, "2": 0}, "score": 4.998916521369348}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7637157912552098, "4": 0.2361480830932187, "3": 0.00013581444212552307, "2": 2.3199175609145673e-07, "1": 0}, "score": 4.763579573318582}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9490613798621186, "5": 0.043888541791351154, "3": 0.0070345046719436696, "2": 1.545248076803109e-05, "1": 6.978240055617429e-08}, "score": 4.036822924703788}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8905391706192587, "4": 0.10941932054181895, "3": 4.131772389730597e-05, "2": 7.268963752857465e-08, "1": 0}, "score": 4.890497812973636}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6460501801277503, "4": 0.35367088559432236, "3": 0.0002778819985589373, "2": 1.016938413257952e-06, "1": 3.043958309518209e-08}, "score": 4.645770176098776}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9966117850987151, "4": 0.0033864147943929194, "3": 1.8237604630833102e-06, "2": 1.3559031232734729e-08, "1": 0}, "score": 4.996609897133741}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6359785771091316, "4": 0.36375878848674487, "3": 0.0002622867990594836, "2": 2.79598833116092e-07, "1": 0}, "score": 4.63571577434504}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6585113182627784, "5": 0.3410608404060841, "3": 0.0004274648479439428, "2": 3.526185356052553e-07, "1": 0}, "score": 4.340632678450151}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9865203344600257, "4": 0.013478285095845664, "3": 1.3247086625810043e-06, "2": 3.18029460933687e-09, "1": 0}, "score": 4.986519055237452}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9821170187800162, "4": 0.017876152803108888, "3": 6.80780370567723e-06, "2": 2.991101588960111e-08, "1": 0}, "score": 4.982110142022768}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8631499056746099, "5": 0.13528111936435538, "3": 0.001562894856686057, "2": 5.96341651711661e-06, "1": 1.1060804620578298e-07}, "score": 4.133705966663401}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.985901793749217, "4": 0.014091894571140708, "3": 6.184551926092302e-06, "2": 5.2085460303742296e-08, "1": 0}, "score": 4.9858955790102}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8636460486745609, "5": 0.13486796718095606, "3": 0.0014837865185643347, "2": 2.2248256610504926e-06, "1": 5.995503334188507e-08}, "score": 4.133379539521306}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9784117620131153, "4": 0.02157992919941951, "3": 8.178784602421687e-06, "2": 6.539003239246337e-08, "1": 0}, "score": 4.9784035156658675}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6936634350591977, "4": 0.30604507008991844, "3": 0.0002898969624543428, "2": 1.5666797294567719e-06, "1": 7.014866929503705e-08}, "score": 4.693370167291463}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.822791369863364, "3": 0.1764277737924581, "5": 0.0004464814070768365, "2": 0.000333840240926064, "1": 2.9084946675308604e-07}, "score": 3.8233501115088724}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9911710332646018, "4": 0.008827544403864377, "3": 1.4002412706677313e-06, "2": 1.0222057004167462e-08, "1": 0}, "score": 4.991169624342622}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7087867453451027, "5": 0.2904585784348668, "3": 0.0007529601147701448, "2": 1.6936865741768723e-06, "1": 7.039145211326114e-08}, "score": 4.289702005874785}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9878239928427085, "4": 0.012173648771901944, "3": 2.309187100289775e-06, "2": 1.1828582365397958e-08, "1": 0}, "score": 4.987821696913051}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921291436892532, "4": 0.00787000957427656, "3": 7.684149117550524e-07, "2": 6.287998628081194e-09, "1": 0}, "score": 4.992128434164887}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9880107358977873, "4": 0.011985328526485654, "3": 3.8423015843160766e-06, "2": 2.545432925920438e-08, "1": 0}, "score": 4.988006909693988}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999777296302151, "4": 0.00022252368780048643, "3": 6.681160793622206e-08, "1": 0, "2": 0}, "score": 4.999777342663779}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9690350949970539, "4": 0.030949584649191956, "3": 1.5158592879997774e-05, "2": 6.037021395999487e-08, "1": 0}, "score": 4.969019913913314}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998607127413711, "4": 0.00013919927756277716, "3": 1.99313493609208e-08, "1": 0, "2": 0}, "score": 4.999860760850263}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997945734529232, "4": 0.00020533043468342672, "3": 6.013366514914019e-08, "1": 0, "2": 0}, "score": 4.999794549290595}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7118035205046287, "4": 0.28794698374802935, "3": 0.0002481269618137301, "2": 1.0981781263818596e-06, "1": 5.754238674097527e-08}, "score": 4.71155317616649}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9963162272003491, "4": 0.0036832771249407665, "3": 4.410357054666726e-07, "2": 2.091613623920608e-09, "1": 0}, "score": 4.9963158343352125}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9755219020928274, "5": 0.02211424075337518, "3": 0.0023616069042849503, "2": 2.1150671427263933e-06, "1": 0}, "score": 4.0197484063844415}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999233997739472, "4": 7.65262300063724e-05, "3": 7.072937184206003e-09, "1": 0, "2": 0}, "score": 4.999923459618997}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996120625871847, "4": 0.0003878256403049861, "3": 1.2761997849606436e-08, "1": 0, "2": 0}, "score": 4.999612148797297}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5772529848217299, "4": 0.42235309364425566, "3": 0.00039296905093403597, "2": 7.872633652293646e-07, "1": 0}, "score": 4.576858536552469}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7185697722257143, "4": 0.2813766262833306, "3": 5.3559305713788127e-05, "2": 5.8169422899673754e-08, "1": 0}, "score": 4.7185160850962635}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8436477747392117, "4": 0.1562837365111919, "3": 6.829875636309079e-05, "2": 7.955668901724552e-08, "1": 0}, "score": 4.843579410031466}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998087558794887, "4": 0.00019112536193663124, "3": 3.614164627890858e-08, "1": 0, "2": 0}, "score": 4.9998088023389755}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.613145569868745, "5": 0.3851264334630683, "3": 0.0017120402346343295, "2": 1.513868756960641e-05, "1": 3.736164875528678e-07}, "score": 4.383383165275604}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6845877135160451, "5": 0.313059659867401, "3": 0.0023507508293614085, "2": 1.7119987677794109e-06, "1": 0}, "score": 4.310705535930474}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9969005397751192, "4": 0.003099084604401905, "3": 3.8567337671601125e-07, "1": 0, "2": 0}, "score": 4.996900144080007}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9814784673684075, "4": 0.018516815755404856, "3": 4.712254980828472e-06, "2": 4.1186228053992e-09, "1": 0}, "score": 4.981473747369455}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998850198707218, "4": 0.00011481539273610765, "3": 5.8756032990166226e-08, "1": 0, "2": 0}, "score": 4.999885067083017}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.906224075107831, "4": 0.09375134195944354, "3": 2.437905977688428e-05, "2": 4.7574449263769534e-08, "1": 0}, "score": 4.906199742536815}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8080896771886374, "4": 0.19160381545412353, "3": 0.00030499474835905604, "2": 1.3051938293255884e-06, "1": 6.694583348363122e-08}, "score": 4.807781984683623}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9953360985235803, "4": 0.0046621502976969455, "3": 1.7223050826951437e-06, "2": 8.936918446200042e-09, "1": 0}, "score": 4.995334378188366}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8414330994975847, "4": 0.15847979026641382, "3": 8.683124809398799e-05, "2": 2.1868423432425515e-07, "1": 0}, "score": 4.84134588161727}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990170941686999, "4": 0.0009825110180337723, "3": 3.2090554803369897e-07, "1": 0, "2": 0}, "score": 4.999016847098208}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8666499693160993, "4": 0.13318244817717032, "3": 0.00016603714991123892, "2": 1.3598107803386722e-06, "1": 0}, "score": 4.866481373316814}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7104489392265135, "4": 0.28929316305390285, "3": 0.00025764909389550746, "2": 2.5858742474516386e-07, "1": 0}, "score": 4.710190765883036}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9375559527361178, "5": 0.05912569366862273, "3": 0.003313070089457477, "2": 5.172300486695328e-06, "1": 3.7390843077631595e-08}, "score": 4.055802170924671}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8357392637586329, "4": 0.16419559653750385, "3": 6.496934595496916e-05, "2": 6.774995780440528e-08, "1": 0}, "score": 4.835674244659584}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998119737691479, "4": 0.00018791045721625567, "3": 3.685192429500398e-08, "1": 0, "2": 0}, "score": 4.9998120158241}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.992823584335202, "4": 0.007175929347071025, "3": 4.640725217770273e-07, "1": 0, "2": 0}, "score": 4.992823142348236}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5260165515049742, "4": 0.47375384809050924, "3": 0.0002290871635440814, "2": 4.396077433658863e-07, "1": 2.9377963043591748e-08}, "score": 4.525786520260876}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9648023927158587, "4": 0.03518551453384829, "3": 1.200561621194857e-05, "2": 2.8821621066117628e-08, "1": 0}, "score": 4.964790385715706}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.650522254655415, "5": 0.34890814020738303, "3": 0.0005687979406492461, "2": 7.930115900267653e-07, "1": 1.4626074155436249e-08}, "score": 4.348337712211675}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7814993037780635, "5": 0.2180551208975186, "3": 0.0004451627554861828, "2": 4.888505587532933e-07, "1": 0}, "score": 4.217608963841349}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9125689451965036, "4": 0.08740753388311641, "3": 2.3443366067574544e-05, "2": 7.452732502118131e-08, "1": 0}, "score": 4.912545355538049}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9569740317067604, "5": 0.03197162142877084, "3": 0.011036602831776626, "2": 1.748287023726319e-05, "1": 0}, "score": 4.0209000583148296}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8291790699464439, "4": 0.17051553023233904, "3": 0.00030476243088500523, "2": 6.493142701033878e-07, "1": 0}, "score": 4.828872999003589}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9843151980508552, "5": 0.012717821518581756, "3": 0.0029656284880692895, "2": 1.2600552358317954e-06, "1": 0}, "score": 4.009749673815912}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987633933289527, "4": 0.001236452978039071, "3": 6.415434604571945e-08, "1": 0, "2": 0}, "score": 4.998763418602547}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9760642498220691, "4": 0.02392668059033465, "3": 8.959868566521823e-06, "2": 2.2374005963156655e-08, "1": 0}, "score": 4.976055330459067}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9693826726832515, "5": 0.02209038572900966, "3": 0.008498150732823107, "2": 2.8571295442354464e-05, "1": 2.2131783526118717e-07}, "score": 4.013534428427998}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9079853907433352, "4": 0.09201012993549741, "3": 4.4207596947654465e-06, "1": 0, "2": 0}, "score": 4.9079810231563465}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8313470017380973, "5": 0.16762364850882017, "3": 0.0010281306793890202, "2": 1.1435386778075734e-06, "1": 3.045020836368381e-08}, "score": 4.166593146912271}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9909024434804489, "4": 0.009096302197188221, "3": 1.2210285263556248e-06, "1": 0, "2": 0}, "score": 4.990901255442827}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8081231651187253, "5": 0.19164756359885238, "3": 0.00022921136244158336, "2": 1.1487089401246267e-07, "1": 0}, "score": 4.191418111976023}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9511170205564458, "5": 0.04520563643630897, "3": 0.0036738173780420376, "2": 3.3882364268680697e-06, "1": 0}, "score": 4.041525048290655}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998741809658787, "4": 0.00012577310855781354, "3": 1.1745542852768263e-08, "1": 0, "2": 0}, "score": 4.999874203396057}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9961879698049902, "4": 0.0038101653188903927, "3": 1.913797633781533e-06, "1": 0, "2": 0}, "score": 4.996186007272429}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9980536248495737, "4": 0.0019462127001182, "3": 1.2327169687043933e-07, "1": 0, "2": 0}, "score": 4.998053540680228}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9923212709345528, "4": 0.007677553018305535, "3": 1.1875229202033582e-06, "1": 0, "2": 0}, "score": 4.992320072023987}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7737464368765566, "5": 0.22433453082910085, "3": 0.0019159360055832559, "2": 3.016166209760475e-06, "1": 3.717237347830217e-08}, "score": 4.222412460526632}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7785942880601336, "4": 0.22124473322725696, "3": 0.00016006949392439535, "2": 8.357661398641581e-07, "1": 6.430875862316606e-08}, "score": 4.778432361225472}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.914917711991948, "4": 0.08500992199085322, "3": 7.218206139998372e-05, "2": 1.9198588178347522e-07, "1": 0}, "score": 4.914845138612502}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9956472677185699, "4": 0.004352287543651631, "3": 4.4984399143114335e-07, "1": 0, "2": 0}, "score": 4.995646812790593}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9669556964873139, "4": 0.03302567466053918, "3": 1.8457587968896233e-05, "2": 5.458563958788302e-08, "1": 0}, "score": 4.966937242548889}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9052228884730065, "5": 0.09122090378474193, "3": 0.003546624403904807, "2": 9.322767791665181e-06, "1": 1.0482767767242453e-07}, "score": 4.087655333013915}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.952929150255276, "4": 0.04705513404442299, "3": 1.5609076281182057e-05, "2": 1.0406376507173936e-07, "1": 0}, "score": 4.952913335491166}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8345874066692937, "4": 0.16523640052599323, "3": 0.000174963531007625, "2": 1.0682732479605632e-06, "1": 1.0382261697672597e-07}, "score": 4.834410042833703}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996859172843064, "4": 0.0003138234472793364, "3": 1.429032512992998e-07, "1": 0, "2": 0}, "score": 4.9996858907096655}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8196127552204668, "4": 0.1800735320718065, "3": 0.0003122476297063153, "2": 1.243043189326886e-06, "1": 0}, "score": 4.8192982034171195}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5179115003832173, "4": 0.48145466782281204, "3": 0.0006321535085726918, "2": 1.4507745089971884e-06, "1": 4.113921640242935e-08}, "score": 4.517276418313649}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8335395895157189, "4": 0.1663816721484323, "3": 7.851922960919758e-05, "2": 7.895356042880412e-08, "1": 0}, "score": 4.833461029190785}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9907510040380442, "4": 0.009243474831571558, "3": 5.468189409893337e-06, "2": 1.4580745208178578e-08, "1": 0}, "score": 4.990745544692371}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999497421129699, "4": 5.018095428343837e-05, "3": 3.162550252203975e-08, "1": 0, "2": 0}, "score": 4.999949755792435}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998810866107576, "4": 0.00011879490965210352, "3": 3.3302079315584e-08, "1": 0, "2": 0}, "score": 4.9998811384760655}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9795336989034704, "4": 0.020464338357553805, "3": 1.9575311422746674e-06, "2": 3.6879613914596987e-09, "1": 0}, "score": 4.9795317354851685}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998013666902087, "4": 0.00019849433446150416, "3": 3.1853295209914285e-08, "1": 0, "2": 0}, "score": 4.999801441937678}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6088668818357206, "5": 0.3905565249443889, "3": 0.0005764538347226226, "2": 1.643260948677268e-07, "1": 0}, "score": 4.38997973273102}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998908601961818, "4": 0.00010905611409417194, "3": 1.1041433041915583e-08, "1": 0, "2": 0}, "score": 4.9998909217951155}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995869316962124, "4": 0.0004129051716347112, "3": 4.696355319500994e-08, "1": 0, "2": 0}, "score": 4.999587000853282}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9247260106959516, "3": 0.06615513267317596, "5": 0.008877404950421611, "2": 0.00024069981061135656, "1": 4.6321061235207584e-07}, "score": 3.9422394663510754}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9933384153894582, "4": 0.006660460850846701, "3": 1.1255339642753378e-06, "1": 0, "2": 0}, "score": 4.993337288093047}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7295223675564813, "5": 0.2689219742515064, "3": 0.00155392234395537, "2": 1.49953874571721e-06, "1": 0}, "score": 4.267365116010926}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9830782959567472, "4": 0.016919931047825187, "3": 1.7957783658757698e-06, "1": 0, "2": 0}, "score": 4.983076477781011}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9715824840113535, "4": 0.028405783789212883, "3": 1.1559973350994406e-05, "2": 4.463225647420382e-08, "1": 0}, "score": 4.971570958739945}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9138883229037693, "4": 0.08601654650624209, "3": 9.447285626646802e-05, "2": 4.4750416142544613e-07, "1": 4.277115115753526e-08}, "score": 4.913792979748045}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9861267400850531, "4": 0.013869755122532062, "3": 3.4027113100481045e-06, "2": 1.093829393012402e-08, "1": 0}, "score": 4.986123405375214}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9021338423024421, "4": 0.09785881522800864, "3": 7.334282278735419e-06, "2": 4.706746179644258e-09, "1": 0}, "score": 4.902126501746544}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995104741568925, "4": 0.0004893155402529131, "3": 1.2498001405343642e-07, "1": 0, "2": 0}, "score": 4.999510434457949}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996474383244791, "4": 0.0003524722719290815, "3": 4.2350525814441803e-08, "1": 0, "2": 0}, "score": 4.9996474430104305}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"4": 0.959105835420231, "5": 0.03051187582019844, "3": 0.010348186417363769, "2": 3.39418768713824e-05, "1": 1.737101033283981e-07}, "score": 4.0200952842526245}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994175204286712, "4": 0.005822386789608766, "3": 2.4222516899591116e-06, "2": 1.7749029474727442e-08, "1": 0}, "score": 4.994172715641017}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6154007730008535, "4": 0.3844562425590742, "3": 0.00014273439962337152, "2": 2.5456694254585054e-07, "1": 0}, "score": 4.615257526682385}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989147838733853, "4": 0.0010850756184438092, "3": 6.43682717454683e-08, "1": 0, "2": 0}, "score": 4.998914795562386}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951327715320706, "4": 0.004866518425079462, "3": 7.231819403799539e-07, "1": 0, "2": 0}, "score": 4.995132035275001}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"4": 0.708642465226257, "5": 0.2899754832768545, "3": 0.0013781999711145359, "2": 3.686400685246139e-06, "1": 5.562155672216447e-08}, "score": 4.288589775241299}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7691189500261552, "4": 0.23080721130821855, "3": 7.373278601166673e-05, "2": 8.172278400241514e-08, "1": 0}, "score": 4.7690450723722675}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7600100896003109, "5": 0.2386684091042786, "3": 0.0013203580885088875, "2": 1.080149608535809e-06, "1": 1.6183720619329823e-08}, "score": 4.2373458532906385}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9518296159986547, "4": 0.04816023010814221, "3": 1.004325794323594e-05, "2": 2.515025000231919e-08, "1": 0}, "score": 4.95181960380652}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999177604552655, "4": 0.0008221822271062027, "3": 1.9540158222619804e-07, "1": 0, "2": 0}, "score": 4.999177426955073}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5700453841541958, "5": 0.42943847318843253, "3": 0.000515841660020187, "2": 2.5676155096419205e-07, "1": 0}, "score": 4.428922136979025}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6007679052394352, "3": 0.38524607231225344, "5": 0.009908718032570221, "2": 0.004073437668649899, "1": 3.6269408719075133e-06}, "score": 3.616504797595867}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9698534309647273, "5": 0.025457494499104626, "3": 0.0046867448468601546, "2": 2.0545062634053903e-06, "1": 0}, "score": 4.020766646354346}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9872627077815181, "4": 0.012734658331546788, "3": 2.5055006077006603e-06, "1": 0, "2": 0}, "score": 4.987260329031638}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.982440457626337, "4": 0.017553977790907612, "3": 5.587765960291917e-06, "2": 1.2903296701144105e-08, "1": 0}, "score": 4.982434808601148}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7466877399889064, "5": 0.2517900685421047, "3": 0.0015203758575307751, "2": 1.6780653592373773e-06, "1": 1.9574815899352057e-08}, "score": 4.2502663073536455}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9978137060297925, "4": 0.002185341870941797, "3": 9.108195849214823e-07, "1": 0, "2": 0}, "score": 4.997812836399603}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9730930804605479, "4": 0.02690562517293973, "3": 1.2560395519600834e-06, "1": 0, "2": 0}, "score": 4.97309186171665}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9872287751581414, "4": 0.01277031426000108, "3": 8.004834334313954e-07, "1": 0, "2": 0}, "score": 4.987228083366964}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999738221619941, "4": 0.0002617177303642486, "3": 3.285979378237039e-08, "1": 0, "2": 0}, "score": 4.999738216542773}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9982277414082239, "4": 0.0017717881289555698, "3": 4.059292311704241e-07, "1": 0, "2": 0}, "score": 4.99822739989819}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8109453524981486, "5": 0.18093668781225483, "3": 0.008066157954241298, "2": 5.043087354975428e-05, "1": 7.884057251197169e-07}, "score": 4.172767403523163}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8316320779240358, "4": 0.1683021000243807, "3": 6.574959806532435e-05, "2": 4.964014279512597e-08, "1": 0}, "score": 4.831566248016518}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951280486431444, "4": 0.004871036163206549, "3": 9.711499035339945e-07, "2": 3.322859930440407e-09, "1": 0}, "score": 4.995127011857273}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9449202751197147, "4": 0.055068979876674175, "3": 1.0627038529041724e-05, "2": 1.6204740727792908e-08, "1": 0}, "score": 4.944909711826038}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9502346232860807, "3": 0.03749476334088513, "5": 0.012186311077891452, "2": 8.383005191715134e-05, "1": 2.867746847710937e-07}, "score": 3.97452302258394}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5667959593910712, "4": 0.4326191496632023, "3": 0.0005837040892732425, "2": 1.0791336658301853e-06, "1": 2.4437426668080256e-08}, "score": 4.566210070879196}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6527506536660694, "4": 0.3470146086727448, "3": 0.00023408365652024943, "2": 5.098231174073664e-07, "1": 0}, "score": 4.65251564444403}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9991454832075968, "4": 0.000854419130023686, "3": 8.031567737448104e-08, "1": 0, "2": 0}, "score": 4.9991454202237975}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9689542808401282, "4": 0.031028336852765258, "3": 1.7149629295648887e-05, "2": 9.039562199317996e-08, "1": 0}, "score": 4.968937088282079}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9330968766789375, "5": 0.04787692612091361, "3": 0.01900547848618357, "2": 2.0460118615982458e-05, "1": 8.251382350546401e-08}, "score": 4.028830284932508}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9990596803778353, "4": 0.000939832396681941, "3": 3.9005230165755116e-07, "1": 0, "2": 0}, "score": 4.999059387407312}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9793372270885586, "4": 0.020660582936128536, "3": 2.16970574714604e-06, "2": 4.331867909836688e-09, "1": 0}, "score": 4.979335064327423}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981027961706828, "4": 0.001897089138385709, "3": 1.4951965218684656e-07, "1": 0, "2": 0}, "score": 4.9981026118883936}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9858783857608171, "4": 0.014120537232688572, "3": 1.052332951395891e-06, "1": 0, "2": 0}, "score": 4.985877357752953}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9464696919772162, "5": 0.04195856480179684, "3": 0.011564965111902492, "2": 6.4466173924496235e-06, "1": 4.671395007822892e-08}, "score": 4.030380574964971}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9751451804925202, "4": 0.024844725561853246, "3": 1.0014344928722335e-05, "2": 2.2213402811327135e-08, "1": 0}, "score": 4.975135177681156}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8350633823550809, "4": 0.1648457320004565, "3": 9.058825401080987e-05, "2": 1.7470971705040575e-07, "1": 0}, "score": 4.834972547116682}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9793969204910548, "4": 0.020598294456251758, "3": 4.822630653742915e-06, "2": 2.091680362113666e-08, "1": 0}, "score": 4.979391998737491}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9839130870495755, "4": 0.016084374599871495, "3": 2.5047966609390456e-06, "2": 1.1391265037806504e-08, "1": 0}, "score": 4.983910581276428}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9053804833900955, "5": 0.08551520351144584, "3": 0.009068313271593754, "2": 3.55521117936906e-05, "1": 3.5983724677948105e-07}, "score": 4.076374713216167}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5842650770948176, "4": 0.41559209526221136, "3": 0.00014245334718987417, "2": 1.972018526588998e-07, "1": 0}, "score": 4.584122332788442}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9505070328265155, "5": 0.030435980541293234, "3": 0.019029935253847864, "2": 2.6602908660914873e-05, "1": 1.4932495495284162e-07}, "score": 4.011352394891268}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9591998180098814, "4": 0.0407928442085284, "3": 7.195260590530419e-06, "2": 2.5734688707248736e-08, "1": 0}, "score": 4.959192683300489}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9613884406980086, "3": 0.031499122206473044, "5": 0.006959344431141487, "2": 0.00015210674710776747, "1": 8.719114206679684e-07}, "score": 3.9751533901635323}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9055079110789829, "5": 0.07214323219738288, "3": 0.022130308160606973, "2": 0.0002164255390855742, "1": 1.9314732582587286e-06}, "score": 4.049574288034818}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9348326122983956, "3": 0.03631777456922735, "5": 0.02859223790258608, "2": 0.0002567994828434473, "1": 5.213860972874265e-07}, "score": 3.991759299761409}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9007430906920559, "5": 0.09696515420685242, "3": 0.0022888380315394716, "2": 2.88334926577947e-06, "1": 6.386087167322214e-08}, "score": 4.094670355040747}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995585806741905, "4": 0.00044129013338755626, "3": 9.417905746361425e-08, "2": 1.1052293134749251e-09, "1": 0}, "score": 4.999558518177839}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9040133418637777, "4": 0.09596882306497588, "3": 1.769100923961893e-05, "2": 3.996411142281013e-08, "1": 0}, "score": 4.903995665030361}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9708202541375854, "5": 0.025258339514209405, "3": 0.003916132575737244, "2": 5.1431593900648315e-06, "1": 3.1745590599759115e-08}, "score": 4.021331827491945}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9802069481788835, "4": 0.01979213188110642, "3": 9.48131150358551e-07, "2": 5.388391066601329e-09, "1": 0}, "score": 4.980205956356095}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9649359045543496, "5": 0.034665164540852555, "3": 0.0003988242557043913, "2": 1.4783944250425226e-07, "1": 0}, "score": 4.034266043194833}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974632328456957, "4": 0.002536683651676971, "3": 6.834530272403544e-08, "1": 0, "2": 0}, "score": 4.997463179619266}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990350507132767, "4": 0.0009648286858516994, "3": 3.944671748844253e-08, "1": 0, "2": 0}, "score": 4.999035092342407}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.882963549080312, "3": 0.1125295303255428, "5": 0.004300869789972545, "2": 0.00020568555240790896, "1": 2.0701946795738039e-07}, "score": 3.8913593301107468}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9938392954439327, "4": 0.006160439232508896, "3": 2.1927460247867883e-07, "1": 0, "2": 0}, "score": 4.993839121934585}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9785464379192639, "5": 0.01569996179610411, "3": 0.005750465907868692, "2": 3.1646661176073563e-06, "1": 1.9205041773773195e-08}, "score": 4.009943108448747}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9912909662680411, "4": 0.008708648209415089, "3": 2.6796592769081205e-07, "1": 0, "2": 0}, "score": 4.991290814834907}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8076566248751278, "5": 0.19013774420216656, "3": 0.002200679725943901, "2": 4.702299093606002e-06, "1": 9.203830388219014e-08}, "score": 4.187927413241298}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8171411768239892, "5": 0.18264209612758378, "3": 0.00021659853219284681, "2": 1.0545642526652442e-07, "1": 0}, "score": 4.182425290889233}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9994246143578434, "4": 0.0005753353326138177, "3": 1.8810850111455292e-08, "1": 0, "2": 0}, "score": 4.999424627027562}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9946116042663053, "4": 0.005387990950506098, "3": 4.5262267752399015e-07, "2": 2.961331022257409e-09, "1": 0}, "score": 4.994611095193906}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9924682582939712, "4": 0.00753100560203375, "3": 6.928987169673176e-07, "1": 0, "2": 0}, "score": 4.992467608275093}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9915564973016904, "4": 0.008442409713893448, "3": 9.88801730641778e-07, "1": 0, "2": 0}, "score": 4.9915556118028865}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8896461264983919, "5": 0.10910735207592476, "3": 0.0012445757128999408, "2": 1.8880707829017687e-06, "1": 0}, "score": 4.107859006438669}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9064774092021214, "4": 0.0934894951814385, "3": 3.294615486104317e-05, "2": 3.5880351616961524e-08, "1": 0}, "score": 4.906444494241636}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6071533705918398, "4": 0.3928040468435636, "3": 4.2638881913128274e-05, "2": 2.0263532398337124e-08, "1": 0}, "score": 4.607110644689813}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978246305531745, "4": 0.0021751438036639362, "3": 1.9772315336407864e-07, "1": 0, "2": 0}, "score": 4.997824460689289}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9057077597096789, "5": 0.09086696183731882, "3": 0.003420618145300444, "2": 4.360468727824334e-06, "1": 0}, "score": 4.087437648971777}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6761786247824382, "4": 0.3233350457606125, "3": 0.0004843035395461647, "2": 1.8116418942133052e-06, "1": 0}, "score": 4.675690842743102}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6913917526805645, "5": 0.2875357438608803, "3": 0.020886944087851616, "2": 0.00018360221786061518, "1": 1.7974635962324362e-06}, "score": 4.266276245467972}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8015754863659037, "5": 0.19703602479156787, "3": 0.0013853686520440577, "2": 3.03046949985313e-06, "1": 5.644867605702493e-08}, "score": 4.195644432364037}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9586637914468363, "4": 0.041324571679961127, "3": 1.139002027997209e-05, "2": 2.8770306672082104e-08, "1": 0}, "score": 4.958652552951399}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9846014795182146, "4": 0.015392661640245057, "3": 5.818610909802935e-06, "2": 1.890841076214527e-08, "1": 0}, "score": 4.984595644084249}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9034582854192034, "5": 0.09065753711579305, "3": 0.005870796290989596, "2": 1.3301935593229324e-05, "1": 6.449358986637897e-08}, "score": 4.0847599447226175}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8749196459862646, "4": 0.12504751423810306, "3": 3.280610276410232e-05, "2": 5.468020915635742e-08, "1": 0}, "score": 4.874886712144038}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9948851526080389, "4": 0.005112713490254964, "3": 2.1106407153640172e-06, "2": 1.5162993739617204e-08, "1": 0}, "score": 4.994883019697896}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997348848192421, "4": 0.0002646106652575295, "3": 3.957219574304137e-07, "1": 0, "2": 0}, "score": 4.999734597861953}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999604699583327, "4": 3.939506513049241e-05, "3": 8.0924598381074e-08, "1": 0, "2": 0}, "score": 4.999960443083535}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5885877826641722, "4": 0.4110321926244248, "3": 0.00037826800713175365, "2": 1.6539850501615935e-06, "1": 5.518636086351367e-08}, "score": 4.588206069086976}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7602059010198999, "4": 0.23973373716275606, "3": 6.0215064264603335e-05, "2": 9.059806334581048e-08, "1": 0}, "score": 4.760145547445494}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8203039308652252, "5": 0.17911747562439456, "3": 0.0005780164092436386, "2": 5.261318448548434e-07, "1": 0}, "score": 4.178538416051437}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983691182353623, "4": 0.0016305905975561555, "3": 2.9748500993597956e-07, "2": 3.575810404201538e-09, "1": 0}, "score": 4.9983688037211325}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.651026298830783, "5": 0.34751616398303103, "3": 0.0014525955329600271, "2": 4.967750182120127e-06, "1": 3.407257596904652e-08}, "score": 4.346053509910101}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8684395486858315, "4": 0.13140994379944926, "3": 0.00014929266259578166, "2": 1.0181492902986758e-06, "1": 9.185321712879266e-08}, "score": 4.868288035204671}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9927842260143119, "4": 0.007213918457017559, "3": 1.7948268555143754e-06, "2": 8.739621105431275e-09, "1": 0}, "score": 4.9927824652953685}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9538759761697901, "5": 0.041012527917009794, "3": 0.005104039469076571, "2": 7.279400849757984e-06, "1": 8.045997348238139e-08}, "score": 4.035893691733044}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984355366506503, "4": 0.0015642190329834915, "3": 2.4437228896932005e-07, "2": 1.5475450505004995e-09, "1": 0}, "score": 4.998435287582312}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9820099826971131, "4": 0.0179862446380595, "3": 3.795649558891284e-06, "2": 1.5673836181156974e-08, "1": 0}, "score": 4.982006117736931}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5611299838670709, "5": 0.4383692268680065, "3": 0.0005004035425300471, "2": 2.553866923077849e-07, "1": 0}, "score": 4.437868369621973}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999444975683012, "4": 0.0005548404294847127, "3": 1.0871435400210297e-07, "1": 0, "2": 0}, "score": 4.999444942100083}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9699915847866705, "5": 0.02536214426376336, "3": 0.004643912763959669, "2": 2.0300563635509336e-06, "1": 0}, "score": 4.0207141781840035}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.987231563096139, "4": 0.012765845432100579, "3": 2.5223362565175704e-06, "1": 0, "2": 0}, "score": 4.987229109012464}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9926494742321964, "4": 0.0073494360249552046, "3": 1.0501631761625375e-06, "1": 0, "2": 0}, "score": 4.992648463357721}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8661269479472763, "4": 0.13380052600736955, "3": 7.218826932420113e-05, "2": 2.4651142392850383e-07, "1": 0}, "score": 4.866054345695212}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8978219305001224, "4": 0.1019556157606547, "3": 0.0002219179142719909, "2": 5.298351057684959e-07, "1": 0}, "score": 4.897598958292118}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7250729416614647, "5": 0.2741096692326214, "3": 0.0008170804483167203, "2": 3.2403801428381843e-07, "1": 0}, "score": 4.273291936504932}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9846343135712077, "4": 0.015363961106059858, "3": 1.698661448986484e-06, "1": 0, "2": 0}, "score": 4.984632641161329}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8224587003037099, "4": 0.17742664909693953, "3": 0.00011414602593561271, "2": 3.997961678874345e-07, "1": 2.1086706894519617e-08}, "score": 4.822343760247711}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9917628259767853, "4": 0.008228788339334743, "3": 8.336184002169125e-06, "2": 5.125221501791954e-08, "1": 0}, "score": 4.991754385550466}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9312792000700784, "3": 0.05612386252164593, "5": 0.012468796943585493, "2": 0.00012784959806926382, "1": 1.4911723921923798e-07}, "score": 3.9560887816496955}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9474781092370967, "4": 0.052497722042110714, "3": 2.4014565881106196e-05, "2": 3.787024975471227e-08, "1": 0}, "score": 4.9474541291050995}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997193962066108, "4": 0.0002804371282040812, "3": 6.400696060803993e-08, "1": 0, "2": 0}, "score": 4.999719434829072}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9994896312224745, "4": 0.000510273347673119, "3": 1.6039859402125224e-08, "1": 0, "2": 0}, "score": 4.999489694532094}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6835753414482909, "4": 0.31326459315567673, "2": 0.0030044964372368432, "5": 0.0001549600835026257, "1": 5.321954648253052e-07}, "score": 3.3105689763088906}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.998329428360833, "4": 0.0016702561184020047, "3": 2.3554473122950182e-07, "1": 0, "2": 0}, "score": 4.998329272658517}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9950620579196151, "4": 0.004933846361949201, "3": 4.035291564471481e-06, "2": 4.054157253317725e-09, "1": 0}, "score": 4.995058070613861}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7974506476998181, "4": 0.20239308645160917, "3": 0.00015578074813095807, "2": 5.34286833932369e-07, "1": 2.062798887651281e-08}, "score": 4.797293680831488}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999608011247674, "4": 0.0003918504876440706, "3": 1.1007388663053402e-07, "1": 0, "2": 0}, "score": 4.999607929353529}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8759219063692247, "5": 0.12101824011429549, "3": 0.0030552116771585423, "2": 4.682309906665069e-06, "1": 5.636260106928105e-08}, "score": 4.1179534833077085}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.948569223683232, "4": 0.05140416904424635, "3": 2.6496418103857493e-05, "2": 4.069530937137853e-08, "1": 0}, "score": 4.94854271242342}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9582147051608674, "4": 0.04175904518554356, "3": 2.6121573870299018e-05, "2": 8.512909226794397e-08, "1": 0}, "score": 4.958188454483607}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987889503132686, "4": 0.001210888852752877, "3": 1.7236370995082751e-07, "1": 0, "2": 0}, "score": 4.998788766433792}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9348030159664027, "4": 0.06515749107868175, "3": 3.929037421521861e-05, "2": 6.674209324103689e-08, "1": 0}, "score": 4.934763719085002}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8966325357483445, "5": 0.09853626755939657, "3": 0.0048226505279309355, "2": 8.499042906866034e-06, "1": 8.349625970875541e-08}, "score": 4.0936963650486815}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9863107458189231, "4": 0.013686894634498986, "3": 2.2383065107783737e-06, "1": 0, "2": 0}, "score": 4.986308627092536}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9880753163660383, "4": 0.011920385228976364, "3": 4.145674733979256e-06, "2": 1.0020448317751786e-08, "1": 0}, "score": 4.988071291657868}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997602541136392, "4": 0.00023969147079253781, "3": 3.285131704912019e-08, "1": 0, "2": 0}, "score": 4.999760242821404}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997076020866047, "4": 0.0002923104896213131, "3": 2.9414296655460164e-08, "1": 0, "2": 0}, "score": 4.999707630664825}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9792608564528249, "4": 0.020734846256429417, "3": 4.263961074551192e-06, "2": 1.3407789404969103e-08, "1": 0}, "score": 4.979256585184805}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9865935557299002, "4": 0.013397618656760561, "3": 8.730630224971522e-06, "2": 3.101415883874589e-08, "1": 0}, "score": 4.986584826182159}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5410905494103591, "4": 0.4584037192808971, "3": 0.0005048034057644629, "2": 9.127434432023857e-07, "1": 4.281484280365702e-08}, "score": 4.54058377712317}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982054077098722, "4": 0.0017944943426262475, "3": 5.437197398155851e-08, "1": 0, "2": 0}, "score": 4.998205396835225}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5476641526704781, "4": 0.45170512064548163, "3": 0.000625050319667967, "2": 5.3277689015531335e-06, "1": 2.2140018081122675e-07}, "score": 4.547027852191831}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7251497237004105, "4": 0.27448452358623493, "3": 0.0003638508598408492, "2": 1.6992951678881832e-06, "1": 8.537265384659693e-08}, "score": 4.724782303066387}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9853428059618157, "4": 0.014656452453097931, "3": 7.058119462638588e-07, "1": 0, "2": 0}, "score": 4.9853421353986525}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9818492967854356, "4": 0.018147798870104804, "3": 2.93316943834697e-06, "1": 0, "2": 0}, "score": 4.981846335314298}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993787777684812, "4": 0.0006212048868068895, "3": 2.326101624824777e-08, "1": 0, "2": 0}, "score": 4.999378748594836}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9794329414133812, "4": 0.02056662423230725, "3": 4.927844399511731e-07, "1": 0, "2": 0}, "score": 4.9794323914005805}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.878740189564332, "3": 0.1162082312679004, "5": 0.004681089485960469, "2": 0.00036976876764533654, "1": 5.383801111261601e-07}, "score": 3.8877316850496455}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9488794233289036, "4": 0.0511022372975497, "3": 1.8225843473785445e-05, "2": 4.1188530717055855e-08, "1": 0}, "score": 4.94886118375045}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9428148519701084, "3": 0.0403615088261304, "5": 0.01675251806116391, "2": 7.067539962476282e-05, "1": 3.209970191489033e-07}, "score": 3.976248692481846}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9870482640475343, "4": 0.012949423619161056, "3": 2.1884642846618202e-06, "1": 0, "2": 0}, "score": 4.987046197847694}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9499156764107459, "5": 0.026687755880797713, "3": 0.02334216260075102, "2": 5.425127844580954e-05, "1": 1.482662044724673e-07}, "score": 4.003236645942548}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9828079708696722, "3": 0.008839768415653546, "5": 0.008346018334619568, "2": 6.31143178412083e-06, "1": 2.8380118209034144e-08}, "score": 3.999493541964388}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5937200897856539, "4": 0.4062232311756106, "3": 5.663904327798399e-05, "2": 2.200344070796623e-08, "1": 0}, "score": 4.593663417416697}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8471752999856235, "3": 0.15185336920779108, "5": 0.0008857011205429453, "2": 8.555150206809682e-05, "1": 1.0980091220802296e-07}, "score": 3.848860904284435}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9959361705941137, "4": 0.004062880801359248, "3": 9.124267761725002e-07, "2": 7.989513241401641e-09, "1": 0}, "score": 4.995935270261972}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9795755621297084, "4": 0.020419360174759624, "3": 5.045584770368657e-06, "2": 5.339958262585906e-09, "1": 0}, "score": 4.979570532088911}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8384141400834761, "3": 0.1557099184280374, "5": 0.005473481463583906, "2": 0.00040182776758286283, "1": 5.604117811236206e-07}, "score": 3.848958215413359}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9683455957686761, "4": 0.03161892959260789, "3": 3.515291545162382e-05, "2": 1.7201657474142804e-07, "1": 3.2183433640571916e-08}, "score": 4.96831011606873}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5079349148427807, "5": 0.49080916142965686, "3": 0.001252209610237444, "2": 3.4814454194337448e-06, "1": 1.0304294436785834e-07}, "score": 4.489549743259573}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9609461403537322, "4": 0.03901091890945658, "3": 4.252769700751264e-05, "2": 1.7311079740843074e-07, "1": 0}, "score": 4.960903496983751}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9935141803170263, "4": 0.006483770957450337, "3": 2.061684893505025e-06, "1": 0, "2": 0}, "score": 4.993512105756841}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9986799180757021, "4": 0.0013198708342667205, "3": 1.913172102177972e-07, "1": 0, "2": 0}, "score": 4.998679746505208}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6083646034641343, "4": 0.3914942581274324, "3": 0.00014110785936266465, "2": 1.0460557379250986e-07, "1": 0}, "score": 4.608223241350738}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5401596148739434, "5": 0.45886665183884157, "3": 0.0009727449865563166, "2": 9.292825501244659e-07, "1": 3.522471042215998e-08}, "score": 4.45789195350786}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9347591691244838, "4": 0.06523216522668382, "3": 8.554329747312395e-06, "1": 0, "2": 0}, "score": 4.9347507188503315}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6569906447134825, "5": 0.3428204288349122, "3": 0.00018884764105271004, "2": 1.0740941454582439e-07, "1": 0}, "score": 4.342631356576164}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8451232874161759, "4": 0.1547963030836892, "3": 8.029774657364718e-05, "2": 8.95997775203873e-08, "1": 0}, "score": 4.845042829190944}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996547035685396, "4": 0.0003452008970913922, "3": 2.7741260036553257e-08, "1": 0, "2": 0}, "score": 4.999654743596982}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9806520190374717, "4": 0.019344417546868425, "3": 3.627394267853154e-06, "2": 5.613204883775584e-09, "1": 0}, "score": 4.980648312171701}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999971839107652, "4": 2.7455435171444323e-06, "3": 2.071085439900147e-09, "1": 0, "2": 0}, "score": 4.999997250314124}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.990798163422059, "4": 0.009200274117413346, "3": 1.4769520786484234e-06, "1": 0, "2": 0}, "score": 4.9907967711914765}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9592866889973459, "4": 0.04070031284311937, "3": 1.2905435225801576e-05, "2": 2.8369562768493982e-08, "1": 0}, "score": 4.959273788556815}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9569907310493151, "4": 0.0429447230813956, "3": 6.423360768810743e-05, "2": 1.9200642537188842e-07, "1": 0}, "score": 4.956926228504107}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8933394474574305, "5": 0.10508572850457785, "3": 0.0015738044095787828, "2": 7.912040008220293e-07, "1": 0}, "score": 4.103510365331291}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9667969005919039, "4": 0.033193025514266554, "3": 1.0009128813930371e-05, "2": 4.683598590048954e-08, "1": 0}, "score": 4.966786815124669}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9985769683710901, "4": 0.001422742403219682, "3": 2.3489294025272443e-07, "1": 0, "2": 0}, "score": 4.9985767877335725}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"3": 0.49938431965372404, "4": 0.34061482008507304, "2": 0.15734547711347976, "5": 0.0023486546596820377, "1": 0.0003066937086796035}, "score": 3.187353271389625}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7149261702580447, "4": 0.28497306840589887, "3": 0.00010054722905570271, "2": 1.678642869123896e-07, "1": 7.053548594648976e-09}, "score": 4.714825294153176}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7676611685268494, "4": 0.23221818422859156, "3": 0.00012047346942760087, "2": 2.358284978791457e-07, "1": 1.6285739326765552e-08}, "score": 4.7675401144148015}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971209381705703, "4": 0.002878564921984766, "3": 4.429269406623821e-07, "2": 5.393318307442241e-09, "1": 0}, "score": 4.997120532904273}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9724597612035698, "4": 0.027538402332016303, "3": 1.7783083690494555e-06, "2": 3.143955866030759e-09, "1": 0}, "score": 4.972458030104238}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5442073427404102, "5": 0.45537227852930345, "3": 0.00041968883093471696, "2": 5.688648232640669e-07, "1": 3.0990659013904876e-08}, "score": 4.454951399962329}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9917926031108846, "4": 0.008204711635748268, "3": 2.6279249909650235e-06, "2": 4.818235763775719e-09, "1": 0}, "score": 4.991790017628455}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9654238734359747, "4": 0.03456132488459411, "3": 1.4743488946383745e-05, "2": 4.609828911985782e-08, "1": 0}, "score": 4.965409049424365}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997660937103428, "4": 0.00023381601793564968, "3": 7.384083046482391e-08, "1": 0, "2": 0}, "score": 4.99976603629656}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9929781289560665, "4": 0.007018320040877743, "3": 3.5085314442092994e-06, "2": 1.9125276496595306e-08, "1": 0}, "score": 4.992974605356387}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9561411388952663, "5": 0.035915098531334844, "3": 0.007938737669916903, "2": 4.918101381534348e-06, "1": 4.4022366616148236e-08}, "score": 4.0279663943472785}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8867111570582212, "4": 0.11326028522261825, "3": 2.841702842645654e-05, "2": 5.59534355579196e-08, "1": 0}, "score": 4.88668270325802}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8995374699850104, "4": 0.10041302992658037, "3": 4.931811994106669e-05, "2": 1.0538157777858783e-07, "1": 0}, "score": 4.899488009990903}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.985174442997957, "4": 0.01482165488046191, "3": 3.857855881240588e-06, "2": 1.9873413569387725e-08, "1": 0}, "score": 4.9851705694258115}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9908476669165364, "4": 0.009150717385327599, "3": 1.5021306866278294e-06, "1": 0, "2": 0}, "score": 4.990846277313735}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.992359539252228, "4": 0.007636692411324975, "3": 3.764473677413924e-06, "2": 2.3550848203472387e-08, "1": 0}, "score": 4.992355708139277}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9419266817236619, "3": 0.05148154937848193, "5": 0.006271419841332172, "2": 0.00031948954745584867, "1": 8.441758592626136e-07}, "score": 3.9541483581373083}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9761721528562899, "5": 0.013346162348414082, "3": 0.01047306558413304, "2": 8.396110458552026e-06, "1": 0}, "score": 4.002856305180607}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999568939990904, "4": 4.3066074731627175e-05, "3": 6.058194612385875e-09, "1": 0, "2": 0}, "score": 4.99995692180742}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9693997010088392, "4": 0.030595094296004547, "3": 5.107456638809609e-06, "2": 3.541766960330445e-08, "1": 0}, "score": 4.969394582645656}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8100059059872098, "5": 0.18699359762745435, "3": 0.002995713036872025, "2": 4.528105128083422e-06, "1": 6.368708768613303e-08}, "score": 4.183988672563243}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9050161410743408, "3": 0.0848916450340755, "5": 0.009687770132948345, "2": 0.000403844643399805, "1": 3.555002089285188e-07}, "score": 3.923987350793623}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9484868497144647, "3": 0.037573209343785614, "5": 0.013916452579231296, "2": 2.342686774595361e-05, "1": 0}, "score": 3.9762963880423055}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7673317513763307, "4": 0.2325843090768449, "3": 8.367552806345272e-05, "2": 2.1055298611254058e-07, "1": 0}, "score": 4.767247695763787}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7865821907787611, "5": 0.20937340381542188, "3": 0.004031973583281633, "2": 1.2086879893128763e-05, "1": 0}, "score": 4.205317327295055}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5285395933585934, "5": 0.4705979306299344, "3": 0.000859673750994833, "2": 2.465332182287974e-06, "1": 1.0282955759598897e-07}, "score": 4.4697331276898336}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6427387923606428, "5": 0.3564813338377484, "3": 0.0007770572729132773, "2": 2.440486874096977e-06, "1": 0}, "score": 4.3556995293489855}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9536597474587644, "5": 0.040979226967594484, "3": 0.005349031834309977, "2": 1.1612737522463999e-05, "1": 1.1860359961002299e-07}, "score": 4.035606623190555}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964862965543579, "4": 0.003512667354668701, "3": 1.0137137403486244e-06, "1": 0, "2": 0}, "score": 4.996485305139201}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5278791310223476, "5": 0.4709709660837614, "3": 0.0011424518277269266, "2": 7.085061532228452e-06, "1": 2.8984109859990523e-07}, "score": 4.469813510392331}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9626190876935424, "5": 0.02588452446141099, "3": 0.011486779656398705, "2": 9.48259068521631e-06, "1": 3.201372883686692e-08}, "score": 4.014378684928074}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9966377184707047, "4": 0.0033617328795258897, "3": 4.92735656706428e-07, "1": 0, "2": 0}, "score": 4.996637281461138}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8520473147079354, "5": 0.14686991734399094, "3": 0.001081692429563022, "2": 9.927499671747718e-07, "1": 0}, "score": 4.1457862514810095}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9799705948723317, "4": 0.020027979661865505, "3": 1.412323976638992e-06, "1": 0, "2": 0}, "score": 4.97996919542694}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9981842644459527, "4": 0.0018155574925483, "3": 1.726343608818726e-07, "1": 0, "2": 0}, "score": 4.998184097228875}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"4": 0.887355994958238, "5": 0.10702183499124411, "3": 0.005607109123602122, "2": 1.4785545645464003e-05, "1": 1.77499507976174e-07}, "score": 4.101384632201534}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8838691567727177, "3": 0.07191395816964029, "5": 0.043200811464846674, "2": 0.0010120823883677612, "1": 3.85141863851266e-06}, "score": 3.9692511299642996}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9763037194665093, "4": 0.023692785179333844, "3": 3.4864135020028573e-06, "1": 0, "2": 0}, "score": 4.976300241781771}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9947836848695213, "4": 0.005214941021444338, "3": 1.3139548489787836e-06, "2": 5.924135901322875e-09, "1": 0}, "score": 4.994782413013501}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9849109593451264, "4": 0.015086243151329332, "3": 2.78688241745791e-06, "2": 1.0226054609937094e-08, "1": 0}, "score": 4.98490815239971}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6373373957337393, "5": 0.3616749857017156, "3": 0.0009846266738056187, "2": 2.899494924806385e-06, "1": 0}, "score": 4.360684593363807}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.99997334352929, "4": 2.659229621768239e-05, "3": 5.233628571056269e-09, "1": 0, "2": 0}, "score": 4.999973397234958}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6703259582845184, "5": 0.3295282476112865, "3": 0.00014575724872618079, "2": 7.484825796741786e-08, "1": 0}, "score": 4.329382328151891}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999718085325412, "4": 0.00028177800876333955, "3": 1.4281754834714285e-08, "1": 0, "2": 0}, "score": 4.999718193393238}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984859280651871, "4": 0.001514016084771298, "3": 6.886450214759268e-08, "1": 0, "2": 0}, "score": 4.998485846205931}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9980080433841444, "4": 0.001991279265098607, "3": 6.195112352778145e-07, "2": 5.747654375849438e-09, "1": 0}, "score": 4.998007464365673}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.791373361948706, "4": 0.20849423249924548, "3": 0.00013217298511887434, "2": 1.6132385026090834e-07, "1": 0}, "score": 4.791240922686327}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6263848753195913, "4": 0.3732760547159114, "3": 0.00033878068731960694, "2": 3.0739385385724843e-07, "1": 0}, "score": 4.626045468502701}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9977593597902752, "4": 0.0022402159757893047, "3": 4.323419547071621e-07, "2": 3.6502981053077023e-09, "1": 0}, "score": 4.997758908415758}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999963211539712, "4": 3.674001756823801e-05, "3": 2.7844621864816103e-08, "1": 0, "2": 0}, "score": 4.999963204292429}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7088432946073664, "5": 0.28978506093295636, "3": 0.0013698596358157214, "2": 1.7680204978667423e-06, "1": 0}, "score": 4.288411670102431}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996562526646581, "4": 0.00034359136470320646, "3": 1.2284677375311156e-07, "1": 0, "2": 0}, "score": 4.999656162930361}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9974889690258174, "4": 0.002509721219337447, "3": 1.3182492862150536e-06, "2": 5.729898615536173e-09, "1": 0}, "score": 4.99748762512813}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983752955635553, "4": 0.0016241502874355495, "3": 5.225856202630213e-07, "1": 0, "2": 0}, "score": 4.998374804490028}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7076999532213132, "5": 0.2912571864209324, "3": 0.0010415992568290494, "2": 1.1493902196507739e-06, "1": 0}, "score": 4.290213320803598}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"5": 0.799029646019452, "4": 0.20077556235301317, "3": 0.00019384707169442378, "2": 8.937676454251959e-07, "1": 7.798681991371298e-08}, "score": 4.798833755724827}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.993652705124236, "4": 0.006345229552393491, "3": 1.9896436611711378e-06, "2": 1.4142986350711112e-08, "1": 0}, "score": 4.993650748340613}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8708723226137566, "5": 0.12629875590385228, "3": 0.002825046936023951, "2": 3.7552601281791954e-06, "1": 8.291150522964737e-08}, "score": 4.123465954204098}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982756159615217, "4": 0.0017241132821425149, "3": 2.5848685379925515e-07, "1": 0, "2": 0}, "score": 4.9982753697229905}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8355562151220405, "4": 0.16439963772199262, "3": 4.401980111218882e-05, "2": 5.571468947038189e-08, "1": 0}, "score": 4.835512143747777}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9977911654732093, "4": 0.00220833818234832, "3": 4.617824242384828e-07, "1": 0, "2": 0}, "score": 4.997790738176446}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997064104058621, "4": 0.00029349175825303214, "3": 3.432070570630608e-08, "1": 0, "2": 0}, "score": 4.99970643958169}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9768878995304158, "4": 0.023077012195267598, "3": 3.4796560927140345e-05, "2": 2.0094019710460293e-07, "1": 2.3415210602736948e-08}, "score": 4.97685269664229}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995931240964598, "4": 0.00040672336357333496, "3": 6.330604593221674e-08, "1": 0, "2": 0}, "score": 4.99959314998803}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999542716355735, "4": 4.565182379607941e-05, "3": 1.3686580632875214e-08, "1": 0, "2": 0}, "score": 4.99995432080017}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9452758077673403, "5": 0.03047586561245429, "3": 0.02416225437609071, "2": 8.543164290310493e-05, "1": 5.413336607821207e-07}, "score": 4.006141124559189}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9731260396813443, "4": 0.02686535877913404, "3": 8.432325196176275e-06, "2": 2.893250885931558e-08, "1": 0}, "score": 4.973117686001848}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5956239663375894, "5": 0.4034346347733175, "3": 0.0009393785672429759, "2": 1.8888016077002286e-06, "1": 8.923888159618503e-08}, "score": 4.4024912279040915}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995335702821776, "4": 0.0004662409487795194, "3": 1.7595580172646314e-07, "1": 0, "2": 0}, "score": 4.999533407133638}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9934779375807998, "4": 0.00651651014615604, "3": 5.516207394650024e-06, "2": 5.0713433545279685e-08, "1": 0}, "score": 4.993472305394371}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9696863425229644, "3": 0.019888909781732154, "5": 0.010391463782621643, "2": 3.298812202261224e-05, "1": 7.865009496538055e-08}, "score": 3.990436339729901}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999536756430062, "4": 4.6288870672993705e-05, "3": 1.586508586020436e-08, "1": 0, "2": 0}, "score": 4.999953679398246}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991107317036185, "4": 0.0008888580579911565, "3": 3.0898008869658646e-07, "1": 0, "2": 0}, "score": 4.999110523891765}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999663107274963, "4": 3.35444880048757e-05, "3": 1.4374356736923623e-08, "1": 0, "2": 0}, "score": 4.9999664267589035}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997912364441444, "4": 0.00020858519313747559, "3": 4.6526211267069184e-08, "1": 0, "2": 0}, "score": 4.999791321726929}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9290578879498346, "4": 0.07089808894773943, "3": 4.334799964903399e-05, "2": 1.2038125566947745e-07, "1": 0}, "score": 4.929014814532184}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9373984940620459, "5": 0.05198760261890893, "3": 0.010552519841964814, "2": 6.067486690052981e-05, "1": 4.1799410808977694e-07}, "score": 4.0413124910668925}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7299822939477136, "4": 0.26988465903881453, "3": 0.00013270605346435332, "2": 2.3902301322645797e-07, "1": 1.766432090218379e-08}, "score": 4.729849118361596}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9218291557928006, "4": 0.07815612892857862, "3": 1.4635645971257695e-05, "2": 4.6849242360199936e-08, "1": 0}, "score": 4.921814456668564}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9301410664340996, "4": 0.06979345789772692, "3": 6.509472768311745e-05, "2": 2.6073324554263763e-07, "1": 4.3943021857263625e-08}, "score": 4.930075389342336}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9671722095336572, "4": 0.032798089901438066, "3": 2.9556850901051624e-05, "2": 1.400346422925182e-07, "1": 0}, "score": 4.967142376171938}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8888623432020609, "4": 0.11109809824386788, "3": 3.9379270876334746e-05, "2": 7.463024372728436e-08, "1": 0}, "score": 4.888822907688638}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9890200901165195, "4": 0.010973785354449109, "3": 6.083867270270867e-06, "2": 1.6481455453691043e-08, "1": 0}, "score": 4.989013997200999}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999074278310677, "4": 9.252182456799849e-05, "3": 2.3421111979351055e-08, "1": 0, "2": 0}, "score": 4.9999074313307155}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9984797498527728, "4": 0.0015197263397062181, "3": 4.3220405961904675e-07, "1": 0, "2": 0}, "score": 4.998479409112883}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9200155931560703, "3": 0.07854610513829938, "5": 0.0013234694755412408, "2": 0.00011470086413343555, "1": 1.7560792952792194e-07}, "score": 3.92254743921184}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995573928294658, "4": 0.00044254725865437234, "3": 1.8933556745853148e-08, "1": 0, "2": 0}, "score": 4.999557414856096}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8701710129856743, "4": 0.1298044878752198, "3": 2.446045074582344e-05, "2": 1.738249798285441e-08, "1": 0}, "score": 4.8701465363091545}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9066010475545921, "5": 0.09190595987336922, "3": 0.0014915800271019938, "2": 1.3485724087973519e-06, "1": 0}, "score": 4.090411688485314}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9894290869952809, "4": 0.010569920504385839, "3": 9.186919243583945e-07, "1": 0, "2": 0}, "score": 4.98942824133148}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9544865825124977, "5": 0.03799935853713276, "3": 0.007490415567611079, "2": 2.3303569772680965e-05, "1": 2.6383049616234466e-07}, "score": 4.030461546653033}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.716162917139489, "4": 0.28353965189607216, "3": 0.00029677834824176093, "2": 5.622686929343854e-07, "1": 0}, "score": 4.715865078930484}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8694913878084427, "4": 0.1303934318508637, "3": 0.00011491130362626615, "2": 1.332587646604757e-07, "1": 0}, "score": 4.869376328029729}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997173703072987, "4": 0.0002825265583325426, "3": 3.337011826960058e-08, "1": 0, "2": 0}, "score": 4.999717406681717}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9958972663026125, "4": 0.0041021678545338745, "3": 6.071657614825723e-07, "1": 0, "2": 0}, "score": 4.995896617983506}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9004658936376009, "3": 0.07610630241507407, "5": 0.023039003383833846, "2": 0.0003874666799863413, "1": 1.1845921734963149e-06}, "score": 3.9461542057935572}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9456632611771447, "5": 0.047339880461741715, "3": 0.006989788365131441, "2": 6.814274192192092e-06, "1": 3.973895087080436e-08}, "score": 4.040336353043333}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8562889597524485, "5": 0.12966332442586506, "3": 0.014034116793567723, "2": 1.3467704470412694e-05, "1": 5.032846577162408e-08}, "score": 4.115602130601176}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.984874306073358, "4": 0.015121661903775714, "3": 4.041757240658915e-06, "2": 1.2312362475661533e-08, "1": 0}, "score": 4.984870217978218}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8100837350935074, "5": 0.09695244290837973, "3": 0.09166010998300624, "2": 0.001298910685511093, "1": 4.347406924142735e-06}, "score": 4.002681470550759}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9643532949256669, "4": 0.03563477471725069, "3": 1.1804296294548405e-05, "2": 2.9757846256907467e-08, "1": 0}, "score": 4.964341523982605}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8472425599025364, "4": 0.15238450715273755, "3": 0.0003706734765511894, "2": 2.058833495235161e-06, "1": 1.392334244074724e-07}, "score": 4.846867403057442}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9897964891503416, "4": 0.010199169332483287, "3": 4.229389083672692e-06, "2": 1.1587974008600634e-08, "1": 0}, "score": 4.989792336099147}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982404554168182, "4": 0.0017590056520748742, "3": 4.882569660050256e-07, "1": 0, "2": 0}, "score": 4.9982400177448065}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9526115433103467, "4": 0.04737322894618615, "3": 1.5193072356874981e-05, "2": 5.6620597755366924e-08, "1": 0}, "score": 4.952596216087796}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7069849503116753, "4": 0.2928106864858609, "3": 0.00020384268776644384, "2": 5.274213933744455e-07, "1": 2.701963535173657e-08}, "score": 4.706779947743764}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9973715604123196, "4": 0.0026280871941759543, "3": 2.894900239825963e-07, "1": 0, "2": 0}, "score": 4.997371333660424}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8509125220442834, "4": 0.14904832451721053, "3": 3.9054400467469864e-05, "2": 4.984184224341265e-08, "1": 0}, "score": 4.850873409819867}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999461661890916, "4": 5.36902573652316e-05, "3": 1.2844540239238033e-08, "1": 0, "2": 0}, "score": 4.999946284046533}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9326860368853594, "5": 0.06491923630740859, "3": 0.002382556995885309, "2": 1.1874693724467123e-05, "1": 1.2142573446739186e-07}, "score": 4.062512576504799}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9162835003445063, "5": 0.06814992645525811, "3": 0.015517257303177502, "2": 4.882607812656788e-05, "1": 2.6095287538657315e-07}, "score": 4.052534246160507}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9981495828367442, "4": 0.0018500270839982744, "3": 3.5531077780503926e-07, "2": 5.773386578031401e-09, "1": 0}, "score": 4.998149244920624}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7658196812661451, "5": 0.2303643944684418, "3": 0.0037826706411303967, "2": 3.283035543430293e-05, "1": 3.8957322183366745e-07}, "score": 4.226514902029339}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9663606478350923, "4": 0.033634700229552, "3": 4.617011147480273e-06, "2": 2.522071894189825e-08, "1": 0}, "score": 4.966355989759532}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.91439922870533, "4": 0.0855313075404138, "3": 6.879496492037177e-05, "2": 5.064090981230968e-07, "1": 5.1527767490824106e-08}, "score": 4.914329367694579}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8264489996810417, "5": 0.1728578497486544, "3": 0.0006927509519923808, "2": 3.82865149439645e-07, "1": 0}, "score": 4.172164335950661}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8768499902378847, "4": 0.12309812222128391, "3": 5.1729155460268064e-05, "2": 1.4896879238776967e-07, "1": 0}, "score": 4.8767979714012775}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5706878450409502, "4": 0.42910162499819365, "3": 0.0002102145252212402, "2": 3.026096941254642e-07, "1": 0}, "score": 4.570477032613247}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999315050358871, "4": 6.842023115153208e-05, "3": 1.3338129815868441e-08, "1": 0, "2": 0}, "score": 4.999931553088387}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992564006071603, "4": 0.0007434802916108473, "3": 1.0757000414171355e-07, "1": 0, "2": 0}, "score": 4.999256304559805}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7940043731536341, "5": 0.20018258578004774, "3": 0.00577093307556289, "2": 4.1221153454869075e-05, "1": 5.991055763628001e-07}, "score": 4.194327468995024}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7127388463974837, "4": 0.2752658007336689, "2": 0.01191721363646603, "5": 7.496599104515576e-05, "1": 3.037517463541682e-06}, "score": 3.263492479806586}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.662477621871122, "5": 0.3350486278266287, "3": 0.002467923919986109, "2": 5.58825211707798e-06, "1": 1.1103803907178107e-07}, "score": 4.332569236555216}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995824038175678, "4": 0.0004174493660292956, "3": 5.0346234856100383e-08, "1": 0, "2": 0}, "score": 4.9995824499012205}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.994742523163904, "4": 0.005256546640860123, "3": 9.297389398910944e-07, "1": 0, "2": 0}, "score": 4.99474159387886}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.794545329905855, "5": 0.20410322667635503, "3": 0.0013496405246866126, "2": 1.658030675358207e-06, "1": 0}, "score": 4.202750299461219}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6493056356028319, "4": 0.350496660629784, "3": 0.00019744332042521747, "2": 1.9037081669451805e-07, "1": 0}, "score": 4.649107857027747}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6444282882854429, "5": 0.3546369105831757, "3": 0.0009334821656365245, "2": 1.1310264214076709e-06, "1": 0}, "score": 4.353701232839067}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9499574185225079, "4": 0.050039068933568694, "3": 3.333485848950172e-06, "1": 0, "2": 0}, "score": 4.949954255133639}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8389528768034351, "3": 0.15191263395425605, "5": 0.007445205580478018, "2": 0.0016878742196669875, "1": 1.309252754385784e-06}, "score": 3.852152880615909}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9574692503116911, "5": 0.04093956189312794, "3": 0.0015902351191547487, "2": 9.096199154643914e-07, "1": 0}, "score": 4.039347509228292}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9928924552224317, "4": 0.0071032816321919675, "3": 4.259654518139435e-06, "2": 2.8468717047047516e-08, "1": 0}, "score": 4.99288811383026}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5400377848107365, "4": 0.4597968580378102, "3": 0.00016514445206514128, "2": 1.976457599002958e-07, "1": 0}, "score": 4.539872253194187}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951590861758658, "4": 0.004840244708133362, "3": 6.680104632396684e-07, "2": 1.6689369000859816e-09, "1": 0}, "score": 4.995158414266857}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.942974997958254, "4": 0.05702283940996813, "3": 2.0796457318153026e-06, "2": 3.727366070683287e-09, "1": 0}, "score": 4.942972985596584}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9996293369325348, "4": 0.00037047277415140514, "3": 8.995115825311793e-08, "1": 0, "2": 0}, "score": 4.999629347286341}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7637286523374246, "5": 0.23329223122879475, "3": 0.002973243007985433, "2": 5.8600641929911655e-06, "1": 5.089098708960414e-08}, "score": 4.230307106776179}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.989633704275604, "4": 0.010363927621002224, "3": 2.299023707831483e-06, "2": 6.290042559756227e-09, "1": 0}, "score": 4.989631454810417}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992803209932531, "4": 0.0007196120576379478, "3": 5.1488157869474944e-08, "1": 0, "2": 0}, "score": 4.999280284954919}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9686487266611872, "4": 0.031341474332658124, "3": 9.715364077757152e-06, "2": 4.6976845761373536e-08, "1": 0}, "score": 4.968638952858789}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9490044891338442, "5": 0.04051080703884176, "3": 0.010435055706905463, "2": 4.799498652054729e-05, "1": 8.960837117887303e-07}, "score": 4.029977095801925}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998230540167875, "4": 0.00017677708957663594, "3": 5.456435533914206e-08, "1": 0, "2": 0}, "score": 4.999823113761489}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5629249294297074, "4": 0.4367988269976448, "3": 0.0002758020940484288, "2": 3.131968281863428e-07, "1": 0}, "score": 4.562648573119558}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995784717679996, "4": 0.00042142868002471097, "3": 7.865080281942046e-08, "1": 0, "2": 0}, "score": 4.999578414009558}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9693757280506601, "4": 0.030611852757689073, "3": 1.2241337671061961e-05, "2": 6.793258639861215e-08, "1": 0}, "score": 4.969363457401597}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7776042035893638, "5": 0.20710292232185976, "3": 0.0150778997496157, "2": 0.00021321382980993013, "1": 1.6474844650869028e-06}, "score": 4.191593674114082}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9249217681678968, "4": 0.0750265220968092, "3": 5.1397552673126695e-05, "2": 2.2113200633864194e-07, "1": 1.2716823945898154e-08}, "score": 4.92486996264931}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5265462378955846, "5": 0.472917558787219, "3": 0.0005354468103967064, "2": 8.147316839974954e-07, "1": 1.2643090203280102e-08}, "score": 4.472380411107541}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6380481425129166, "4": 0.36146354000282566, "3": 0.0004868154302715634, "2": 1.430588013442121e-06, "1": 0}, "score": 4.637558511470357}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.752258044207309, "4": 0.2474691379252516, "3": 0.00027213154153082593, "2": 6.834973895697604e-07, "1": 0}, "score": 4.751984547798002}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7258616406040113, "3": 0.2667434883919516, "5": 0.0045286182866408, "2": 0.0028622936501043043, "1": 4.0192389064968194e-06}, "score": 3.7320485010008357}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.996778766142317, "4": 0.0032202154877612197, "3": 9.737930794206195e-07, "2": 4.390274865887024e-09, "1": 0}, "score": 4.996777823625767}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9040183103347579, "4": 0.09592560843973155, "3": 5.58481587926305e-05, "2": 1.1347219590897224e-07, "1": 0}, "score": 4.903962343340518}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984533674707414, "4": 0.0015456038555133143, "3": 1.0454553770025638e-06, "2": 8.92389791338046e-09, "1": 0}, "score": 4.998452278501825}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9229732467521102, "5": 0.06892365749690631, "3": 0.0080812767929771, "2": 2.1485914007182357e-05, "1": 2.824218392112529e-07}, "score": 4.0607985646881515}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6087985221000155, "5": 0.3903719212724263, "3": 0.0008278912936999541, "2": 1.4667859198865648e-06, "1": 3.3126873359172045e-08}, "score": 4.389541061464564}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9959680974332902, "4": 0.004030313961414, "3": 1.587043034342009e-06, "2": 1.0302626234375574e-08, "1": 0}, "score": 4.995966481079894}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6924485636478918, "5": 0.3068721707585271, "3": 0.0006788794409495148, "2": 2.5911781357625866e-07, "1": 0}, "score": 4.306192811979099}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9623962334833437, "4": 0.03759669993967204, "3": 6.843084347296179e-06, "1": 0, "2": 0}, "score": 4.962389605485987}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999002763027385, "4": 9.956140186095312e-05, "3": 3.8440278800346716e-08, "1": 0, "2": 0}, "score": 4.99990036170524}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5177243092126714, "2": 0.4776600939335655, "4": 0.004380326561293937, "1": 0.0002199885628519229, "5": 1.526101531374263e-05}, "score": 2.5263107677205094}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9707959858762027, "4": 0.02920081672689246, "3": 3.1470186928641834e-06, "1": 0, "2": 0}, "score": 4.97079288776432}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9307056473097258, "5": 0.06499935059386658, "3": 0.004288145173613499, "2": 6.614885961011501e-06, "1": 5.819025128112958e-08}, "score": 4.060697812236663}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9414172936910528, "5": 0.05476205784071413, "3": 0.0038100182493475444, "2": 1.0472937593393545e-05, "1": 9.927540305027902e-08}, "score": 4.0509307988442576}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7119503308824942, "5": 0.28712988632703923, "3": 0.0009171229648377904, "2": 2.480751548365709e-06, "1": 6.501849949034809e-08}, "score": 4.286207639447185}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7882749804773497, "4": 0.1998957096874496, "2": 0.011742764679674165, "5": 8.155947901742806e-05, "1": 4.9561516271616495e-06}, "score": 3.1883061572222733}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9986643413870262, "4": 0.0013351254787150482, "3": 5.314838634608441e-07, "1": 0, "2": 0}, "score": 4.998663811551353}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9374026842426794, "4": 0.06257273117577566, "3": 2.4499937290213285e-05, "2": 4.3946669279443707e-08, "1": 0}, "score": 4.937378134561077}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997540680162295, "4": 0.0002457927148005534, "3": 4.485400297123285e-08, "1": 0, "2": 0}, "score": 4.999754117553979}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9072818476549757, "4": 0.09270111300091892, "3": 1.6911680853892408e-05, "2": 4.161355006495735e-08, "1": 0}, "score": 4.907264930816898}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5231939983230655, "5": 0.4763244925355181, "3": 0.00048014299124412636, "2": 1.3580645456819905e-06, "1": 3.4688729535482215e-08}, "score": 4.475841516690133}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7851375214363329, "5": 0.21121776840147846, "3": 0.0036294632741441344, "2": 1.5013991874627527e-05, "1": 1.1494500963882077e-07}, "score": 4.207557956790258}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9265701509879999, "4": 0.07340555977330167, "3": 2.4118074965682867e-05, "2": 5.6942035931592997e-08, "1": 0}, "score": 4.926546024860621}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5057452474563433, "5": 0.4935427488750238, "3": 0.0007059232764217654, "2": 5.870287191634699e-06, "1": 1.4746750360230473e-07}, "score": 4.492824673491021}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992590211105441, "4": 0.0007408362072124111, "3": 5.728654829703635e-08, "1": 0, "2": 0}, "score": 4.999259049156417}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7893233812022594, "4": 0.2103263935224232, "3": 0.0003483037200701707, "2": 1.7718825305384301e-06, "1": 5.46113554797461e-08}, "score": 4.78897144488376}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.996482031203543, "4": 0.003515776034977225, "3": 2.1984192029284353e-06, "2": 2.224367807873311e-08, "1": 0}, "score": 4.996479760493803}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7530387889192524, "5": 0.24452209647984807, "3": 0.002434365819758312, "2": 4.482928688549109e-06, "1": 8.278110517218322e-08}, "score": 4.2420785607770455}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994529542441214, "4": 0.0005466959828977758, "3": 3.147091367787257e-07, "1": 0, "2": 0}, "score": 4.999452674579637}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9913554062404177, "4": 0.008641074849727938, "3": 3.4279779142512725e-06, "2": 1.6516102877205535e-08, "1": 0}, "score": 4.991352019002588}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9766101687584203, "5": 0.02112981083144043, "3": 0.002254263425415792, "2": 5.596733130516607e-06, "1": 1.0479508133366181e-07}, "score": 4.018864040600654}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5285252278476741, "4": 0.47128845567261, "3": 0.00018607569586938385, "2": 1.8553913626159784e-07, "1": 0}, "score": 4.528338810261458}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.874452607340029, "5": 0.12480328515947936, "3": 0.0007438689359551651, "2": 3.3662610608917343e-07, "1": 0}, "score": 4.124058730805919}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957487851064629, "4": 0.004251065591758939, "3": 1.999073155623247e-07, "1": 0, "2": 0}, "score": 4.995748534808758}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9918539384537535, "4": 0.00814524954160218, "3": 7.549962912206361e-07, "1": 0, "2": 0}, "score": 4.991853240001382}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9710906535782717, "4": 0.028875491171975128, "3": 3.340296130785595e-05, "2": 3.906212173838403e-07, "1": 3.722571689996228e-08}, "score": 4.971056381431464}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7824479940925907, "4": 0.21731981686425558, "3": 0.00023132821771361408, "2": 8.117146295464573e-07, "1": 0}, "score": 4.782215080860834}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8934445014195838, "3": 0.09902830110034992, "5": 0.007135583153490236, "2": 0.000391024359268512, "1": 6.157394091576857e-07}, "score": 3.907323388504847}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996548227073943, "4": 0.00034494554292024043, "3": 1.38531236839682e-07, "1": 0, "2": 0}, "score": 4.999654777362426}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9941531889182448, "4": 0.005846257886153298, "3": 5.111514045109629e-07, "1": 0, "2": 0}, "score": 4.994152719565194}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8780854733748341, "3": 0.11686622200890838, "5": 0.004673114093920771, "2": 0.0003745094581195533, "1": 5.461162345865002e-07}, "score": 3.887056219578534}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9954871709526005, "4": 0.004511369558764591, "3": 1.5127429981680855e-06, "1": 0, "2": 0}, "score": 4.99548560519565}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9464561263243395, "5": 0.033584783050443955, "3": 0.019912713139482324, "2": 4.594001657071356e-05, "1": 2.9126567901138135e-07}, "score": 4.013579318066126}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9803376567072254, "4": 0.01965879417639329, "3": 3.497811747490578e-06, "1": 0, "2": 0}, "score": 4.980334209191166}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9500204626385486, "5": 0.026601709455900225, "3": 0.02332359896178065, "2": 5.396952621746064e-05, "1": 1.46948889661969e-07}, "score": 4.003169730951511}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"2": 0.8579680739799973, "3": 0.1408610127398346, "4": 0.0006360358043887487, "1": 0.0005344325650526162, "5": 4.2014455765255155e-07}, "score": 2.1415999157241195}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9978284294783396, "4": 0.002170696923691692, "3": 8.137041411282179e-07, "2": 4.92643615379161e-09, "1": 0}, "score": 4.99782766076931}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9738509722010057, "4": 0.02613066630911369, "3": 1.814301354513792e-05, "2": 5.993603060840793e-08, "1": 8.883501896206274e-09}, "score": 4.973832828405602}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99948486922544, "4": 0.0005144319375364319, "3": 6.624697105869331e-07, "2": 9.721100545867786e-09, "1": 0}, "score": 4.999484213945997}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9959742494476314, "4": 0.004021470689887247, "3": 4.216226602283012e-06, "2": 4.770879855415954e-08, "1": 0}, "score": 4.995969953666325}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7849870563984995, "5": 0.20936010902639363, "3": 0.005634623208546272, "2": 1.7905332221653076e-05, "1": 1.805769200658987e-07}, "score": 4.203689158976959}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9995099975604267, "4": 0.0004894956415083246, "3": 5.040380881521424e-07, "1": 0, "2": 0}, "score": 4.999509496280962}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7432839948799037, "4": 0.25634786736975573, "3": 0.0003671307890361925, "2": 9.973780014230217e-07, "1": 2.305892363287427e-08}, "score": 4.742914790146857}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998908601961818, "4": 0.00010898023744689849, "3": 4.616647276647959e-08, "1": 0, "2": 0}, "score": 4.99989092741724}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9345715088876793, "5": 0.06279333133999514, "3": 0.002615413677248805, "2": 1.9134683109546258e-05, "1": 3.561716711481276e-07}, "score": 4.060138595131307}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9674886697495026, "4": 0.03249276596872447, "3": 1.8421649163686966e-05, "2": 7.253185443963771e-08, "1": 0}, "score": 4.96747017085702}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9915646975078309, "4": 0.00843296709778396, "3": 2.1895314210939642e-06, "2": 3.0866666171639e-08, "1": 0}, "score": 4.991562560269101}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8251687319366271, "4": 0.17461584315043832, "3": 0.00021507688265797432, "2": 2.690106142350932e-07, "1": 0}, "score": 4.824953182220263}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9312279103492846, "4": 0.06875824653698262, "3": 1.3670094422138537e-05, "2": 3.721536958900703e-08, "1": 0}, "score": 4.931214292286695}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9975831532882801, "4": 0.002416442165822216, "3": 3.3412522135365194e-07, "1": 0, "2": 0}, "score": 4.99758288941352}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9635638292947208, "4": 0.03643126661886219, "3": 4.807578648860138e-06, "2": 1.7657556762693664e-08, "1": 0}, "score": 4.963559062377794}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7988490777350428, "5": 0.20010328914926157, "3": 0.0010452481057239898, "2": 2.3532269536038803e-06, "1": 2.8389911038982276e-08}, "score": 4.1990532500953055}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5608198488924496, "5": 0.4384061566471383, "3": 0.0007725355738201755, "2": 1.4431851172759747e-06, "1": 4.1340590450736474e-08}, "score": 4.437630599460852}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9955230817094682, "4": 0.004476279707410445, "3": 6.29247610698859e-07, "2": 5.310685043172429e-09, "1": 0}, "score": 4.995522445847292}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9932823075583881, "4": 0.006716672572349173, "3": 1.027903774381243e-06, "2": 4.505941399564282e-09, "1": 0}, "score": 4.993281258186534}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5568954548159978, "4": 0.4423710807148778, "3": 0.0007314589182878821, "2": 1.7983823348478345e-06, "1": 0}, "score": 4.55616051435198}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.894084991084633, "4": 0.10551340210115474, "3": 0.00038723891654752286, "2": 1.3882493111930692e-05, "1": 3.8674278621028665e-07}, "score": 4.893668915124456}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9392781258190843, "4": 0.06069536153887848, "3": 2.6319222295158446e-05, "2": 1.0647794100119312e-07, "1": 0}, "score": 4.93925167530114}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998702477485516, "4": 0.000129706156569566, "3": 3.396429537971525e-08, "1": 0, "2": 0}, "score": 4.999870225913265}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996390970411464, "4": 0.00036064913408565235, "3": 1.9914691863936908e-07, "1": 0, "2": 0}, "score": 4.999638952552335}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6213512729797724, "5": 0.37665086807018505, "3": 0.0019942574568597663, "2": 3.177534424849082e-06, "1": 1.3414131542015398e-07}, "score": 4.374649961700624}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9946075952933915, "4": 0.005389131708935337, "3": 3.291158261423314e-06, "1": 0, "2": 0}, "score": 4.994604286072532}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9348948087810349, "4": 0.06498503931259572, "3": 0.00011921809633080344, "2": 4.160555716124749e-07, "1": 0}, "score": 4.934775242557618}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9496942455317827, "4": 0.05026393284138415, "3": 4.165200713484759e-05, "2": 3.818706466553883e-08, "1": 0}, "score": 4.949652641965866}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9684995449359382, "4": 0.031458942375112146, "3": 4.121422888276898e-05, "2": 8.479400435576335e-08, "1": 0}, "score": 4.968458368045733}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5272181706796439, "4": 0.47244119255273764, "3": 0.00033985534050318806, "2": 7.359644654659486e-07, "1": 4.776961829746771e-08}, "score": 4.526876698885866}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7923422632101396, "3": 0.19959708887614205, "5": 0.004583770345380446, "2": 0.003472361044913757, "1": 4.259609792001814e-06}, "score": 3.7980291286609646}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9239317811409994, "3": 0.07420499596579747, "5": 0.0017746903890028627, "2": 8.836081109659858e-05, "1": 1.2419971029725938e-07}, "score": 3.927392596753509}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9479952853490289, "4": 0.051993508746028115, "3": 1.1052532176593395e-05, "2": 3.2032462347253935e-08, "1": 0}, "score": 4.947984283780629}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6050603946898114, "5": 0.39426137551415535, "3": 0.0006772933975379973, "2": 7.635914058027666e-07, "1": 0}, "score": 4.393582622947673}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6529013520198966, "5": 0.34633024285929187, "3": 0.0007679896511288771, "2": 3.4872715895203797e-07, "1": 0}, "score": 4.345561578817496}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997410780860659, "4": 0.0002587679095830741, "3": 1.1778769828523874e-07, "1": 0, "2": 0}, "score": 4.99974099650564}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7974645154871617, "4": 0.20237847419827604, "3": 0.00015681935816237974, "2": 2.2460848883702392e-07, "1": 0}, "score": 4.7973072200809685}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999352000996042, "4": 6.475873260446942e-05, "3": 1.1332410848859916e-08, "1": 0, "2": 0}, "score": 4.9999352186006405}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8433168428944157, "4": 0.15660161227192249, "3": 8.126671783097442e-05, "2": 2.4697369597936295e-07, "1": 0}, "score": 4.843235108489335}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8290359908602772, "4": 0.1709012285806912, "3": 6.272377472373944e-05, "2": 6.755613196339341e-08, "1": 0}, "score": 4.828973123043737}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.702500005461401, "5": 0.29410727418942284, "3": 0.0033792482684738808, "2": 1.3153061667690862e-05, "1": 1.955854438616632e-07}, "score": 4.2907011689235715}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984285257607705, "4": 0.0015708061815192305, "3": 6.437547540910038e-07, "2": 1.6411280437551384e-09, "1": 0}, "score": 4.998427901349961}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8568956754997353, "4": 0.1430763178251074, "3": 2.767237319622388e-05, "2": 6.396389841560388e-08, "1": 0}, "score": 4.856868106842805}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99873354712917, "4": 0.0012660578008788007, "3": 3.027374223651478e-07, "1": 0, "2": 0}, "score": 4.998733336607322}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6793855107643957, "2": 0.31261436773713747, "4": 0.007933380830126537, "1": 5.172367246039337e-05, "5": 1.505845395338678e-05}, "score": 2.6952456952905015}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998709628860046, "4": 0.00012884376649935803, "3": 9.715171579324705e-08, "1": 0, "2": 0}, "score": 4.999870961917656}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.989916915611533, "4": 0.010077107619749042, "3": 5.83613380527849e-06, "2": 1.408924636065063e-08, "1": 0}, "score": 4.989911176568206}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999953079650794, "4": 4.682665340280809e-05, "3": 2.3151922835838788e-08, "1": 0, "2": 0}, "score": 4.999953127039445}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9974710621648298, "4": 0.0025284535707040335, "3": 4.879226245083487e-07, "1": 0, "2": 0}, "score": 4.997470570593299}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"4": 0.961379290246377, "3": 0.019664519650846073, "5": 0.01891439512494122, "2": 4.135695302856315e-05, "1": 2.0605164411280377e-07}, "score": 3.9991665432197663}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8170862504401796, "5": 0.1789574340541706, "3": 0.003929881524472646, "2": 2.5806671866268766e-05, "1": 3.245241115060765e-07}, "score": 4.174975018593478}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8140363971790988, "5": 0.18440460413079568, "3": 0.0015577091976719747, "2": 1.2336738136000954e-06, "1": 2.7688297110816988e-08}, "score": 4.182844349664076}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952522531507279, "4": 0.004746926134467999, "3": 7.681467817422588e-07, "2": 5.244908712084231e-09, "1": 0}, "score": 4.99525152161253}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5746721929330624, "4": 0.4250885835050572, "3": 0.00023760569545330727, "2": 1.383660547499434e-06, "1": 0}, "score": 4.574431954451856}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7140139849997418, "4": 0.28589730673572744, "3": 8.835763016465624e-05, "2": 3.095488258732482e-07, "1": 0}, "score": 4.71392503760392}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999574899895761, "4": 4.2463358790563133e-05, "3": 1.1572664828558926e-08, "1": 0, "2": 0}, "score": 4.999957513494389}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5650369227335655, "5": 0.43397812906977046, "3": 0.000984458809268593, "2": 4.960126036299861e-07, "1": 0}, "score": 4.432992675366629}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9978251025243363, "4": 0.002174568554207961, "3": 2.866817848238323e-07, "1": 0, "2": 0}, "score": 4.997824857990344}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9690394576028717, "4": 0.030952323808639423, "3": 7.951412278346664e-06, "1": 0, "2": 0}, "score": 4.969031765092828}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9036721050860101, "4": 0.09626985898306235, "3": 5.769892589277526e-05, "2": 1.8969562936338233e-07, "1": 0}, "score": 4.903614159879724}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7007424452109949, "4": 0.29884913444554695, "3": 0.0004041149058589519, "2": 4.1908876366947275e-06, "1": 1.421434610868424e-07}, "score": 4.700329502774937}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9967915547962471, "4": 0.003206796869508865, "3": 1.627157386878309e-06, "2": 6.2297664052155534e-09, "1": 0}, "score": 4.996789930078437}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975045089277639, "4": 0.0024942030989896233, "3": 1.2458394477931634e-06, "2": 7.341093699784212e-09, "1": 0}, "score": 4.997503283111966}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9954950886908506, "4": 0.004503839607059906, "3": 1.061958195346311e-06, "1": 0, "2": 0}, "score": 4.995494036432644}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6285302573165304, "5": 0.3667751459604984, "3": 0.004672831846353462, "2": 2.1488062706016223e-05, "1": 2.325633909113339e-07}, "score": 4.362058656319845}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.761503218598432, "4": 0.23792980161852156, "3": 0.0005624749264945494, "2": 4.2786244081310026e-06, "1": 1.0763359680394203e-07}, "score": 4.760931953767756}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9638636502738869, "4": 0.03610332184534839, "3": 3.270331856637816e-05, "2": 2.5044212025137113e-07, "1": 3.321334778846144e-08}, "score": 4.963830385858187}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9834038618236094, "4": 0.016590245115407375, "3": 5.775111467564048e-06, "2": 6.490293440537666e-08, "1": 0}, "score": 4.983398009072175}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.854778156324254, "5": 0.10049196549521984, "3": 0.04396092973950935, "2": 0.0007657261183539105, "1": 2.60947110219936e-06}, "score": 4.0549917888074996}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8932125486693592, "4": 0.10674476157226982, "3": 4.257280026684491e-05, "2": 6.394874076793167e-08, "1": 0}, "score": 4.893169895317978}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8540039328443622, "5": 0.1336362128956629, "3": 0.012287681776584574, "2": 7.084639324779176e-05, "1": 7.616665313080131e-07}, "score": 4.12120462174374}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9466261610818548, "4": 0.05334878903459765, "3": 2.4899968986910235e-05, "2": 3.7784986339732315e-08, "1": 0}, "score": 4.946601291684896}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8182507819207668, "4": 0.18158316878722477, "3": 0.0001652817441417648, "2": 4.325382825176405e-07, "1": 0}, "score": 4.818084909166345}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.994109241757268, "4": 0.005888268484528221, "3": 2.4187963924770266e-06, "2": 1.302415664952749e-08, "1": 0}, "score": 4.994106854508782}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9967072354789404, "4": 0.0032922271432187116, "3": 4.84647264646897e-07, "1": 0, "2": 0}, "score": 4.9967068033886}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7291108287973819, "4": 0.2707558734708124, "3": 0.00013317719809298413, "2": 9.080994780648373e-08, "1": 0}, "score": 4.728977491647349}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.96384305080008, "4": 0.03614650556204741, "3": 1.0401619945047665e-05, "2": 2.474560350184496e-08, "1": 0}, "score": 4.963832616336557}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999057298562453, "4": 0.0009425373601606348, "3": 1.0278257522445711e-07, "1": 0, "2": 0}, "score": 4.999057257016903}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7646369369747412, "4": 0.23531898553434438, "3": 4.400562901806028e-05, "2": 4.291827976584794e-08, "1": 0}, "score": 4.764592867639245}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9059175513546383, "4": 0.09403442879441143, "3": 4.7751408217807055e-05, "2": 1.948002816299615e-07, "1": 0}, "score": 4.905869477056305}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8292302235810866, "5": 0.17011966122280864, "3": 0.0006495387905022346, "2": 6.047715823742898e-07, "1": 0}, "score": 4.16946890808199}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9418828925701154, "5": 0.055640801885390785, "3": 0.002474314230353287, "2": 1.921864018344469e-06, "1": 2.080684120977917e-08}, "score": 4.05316258409248}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999135066767632, "4": 8.645080795120899e-05, "3": 1.2889742460312424e-08, "1": 0, "2": 0}, "score": 4.999913523410002}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.998842112669446, "4": 0.0011576212799477572, "3": 2.0793735094374017e-07, "1": 0, "2": 0}, "score": 4.998841962778053}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7184959214197829, "5": 0.28030592022595363, "3": 0.0011958556795588428, "2": 2.2183874497588207e-06, "1": 0}, "score": 4.279105651296544}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8055440349606992, "5": 0.19392144977096157, "3": 0.0005343143082115722, "2": 2.1730716008429984e-07, "1": 0}, "score": 4.1933866976871315}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9318502436373051, "5": 0.06670042194957393, "3": 0.001448360575193999, "2": 8.640147470008462e-07, "1": 0}, "score": 4.065250340510885}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999856212553752, "4": 1.4295896784784378e-05, "3": 3.8255943351493985e-09, "1": 0, "2": 0}, "score": 4.999985696450897}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998251993094213, "4": 0.00017466477369397206, "3": 7.923323439064113e-08, "1": 0, "2": 0}, "score": 4.999825176749927}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.860034151049802, "5": 0.13751217779711908, "3": 0.002450347077924461, "2": 3.307324511871931e-06, "1": 4.429269818519528e-08}, "score": 4.135055079472381}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.932622890582262, "4": 0.06736673020967653, "3": 1.0204395491078882e-05, "2": 1.6613985438326005e-08, "1": 0}, "score": 4.932612800496825}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.941725455875698, "4": 0.05824818184411668, "3": 2.631527470789063e-05, "2": 3.990133719312525e-08, "1": 0}, "score": 4.941699067488277}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992698423948916, "4": 0.0007299391379271999, "3": 1.627152656728972e-07, "1": 0, "2": 0}, "score": 4.999269735390827}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9535993579137311, "4": 0.046359520663748814, "3": 4.094257838950222e-05, "2": 8.400453932330738e-08, "1": 0}, "score": 4.953558337761345}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9397276309626755, "3": 0.05540505189200646, "5": 0.004753563650576369, "2": 0.00011341272041383852, "1": 2.440362639379382e-07}, "score": 3.949120949287009}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9992093842714438, "4": 0.0007904941513609436, "3": 7.203721330454837e-08, "1": 0, "2": 0}, "score": 4.999209361735043}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9151335985689252, "5": 0.08286688117341294, "3": 0.0019988175465312716, "2": 6.877846890190228e-07, "1": 1.2959716775543587e-08}, "score": 4.080866649337397}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951642839053467, "4": 0.004834346594276572, "3": 1.4046477476904512e-06, "2": 8.615930185630321e-09, "1": 0}, "score": 4.995162818474128}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9943636538383738, "4": 0.00563561498950514, "3": 6.779671510218678e-07, "1": 0, "2": 0}, "score": 4.994363028776278}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8607034663270778, "5": 0.13072437237874746, "3": 0.00855695394246695, "2": 1.4952754912807056e-05, "1": 0}, "score": 4.122137544022283}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9150434669239652, "5": 0.08154269751755139, "3": 0.0034076887616242666, "2": 6.082717528010847e-06, "1": 7.151382852520814e-08}, "score": 4.078122628198583}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5665814677155518, "4": 0.4330299001064912, "3": 0.00038769368569294116, "2": 8.396086051044406e-07, "1": 0}, "score": 4.5661921507998}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997360765339272, "4": 0.0002637591979600218, "3": 5.6580071917355575e-08, "1": 0, "2": 0}, "score": 4.99973612761348}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9847315254076724, "4": 0.015264933640064426, "3": 3.4656616194000824e-06, "2": 1.664922779956457e-08, "1": 0}, "score": 4.984728084193447}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"4": 0.766261441524848, "5": 0.23142896481374198, "3": 0.0023070415258904585, "2": 2.513033421621529e-06, "1": 3.841480134221274e-08}, "score": 4.229116782134075}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996955661194009, "4": 0.0003042916321880219, "3": 9.800473922562177e-08, "1": 0, "2": 0}, "score": 4.999695512344862}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.778435066238918, "4": 0.2212551762251181, "3": 0.0003090263529732462, "2": 6.927982539371031e-07, "1": 2.9675145302529665e-08}, "score": 4.778124572041149}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9922630494820491, "4": 0.007731576434364026, "3": 5.311623635770879e-06, "2": 8.726364424959373e-09, "1": 0}, "score": 4.992257773723254}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996549418762527, "4": 0.0003447469114988596, "3": 2.0035400701287368e-07, "1": 0, "2": 0}, "score": 4.999654852342224}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8480174208042572, "5": 0.15069978500395123, "3": 0.0012808555831637326, "2": 1.7868343917075968e-06, "1": 0}, "score": 4.14941537842941}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8362029685651674, "4": 0.16369271462896667, "3": 0.00010413046227808779, "2": 1.46892986245752e-07, "1": 0}, "score": 4.836098577301509}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8526886448693524, "4": 0.14729365968360508, "3": 1.765838176099079e-05, "2": 1.3653212432008205e-08, "1": 0}, "score": 4.852670979143958}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993259185550465, "4": 0.0006740184995669038, "3": 5.93156887598938e-08, "1": 0, "2": 0}, "score": 4.999325862866608}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.990984503509442, "4": 0.009014697302358583, "3": 6.948728206480391e-07, "2": 1.4467719552844692e-09, "1": 0}, "score": 4.990983907684211}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9587158300884419, "3": 0.039287632668550405, "5": 0.001968452850226857, "2": 2.7970588795686142e-05, "1": 6.386099939509334e-08}, "score": 3.9626246855544522}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999690523188893, "4": 3.086295378371553e-05, "3": 2.1765101467407414e-08, "1": 0, "2": 0}, "score": 4.999969093514067}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9675474735628437, "4": 0.03243671885134829, "3": 1.570420573929645e-05, "2": 2.2067255030796044e-08, "1": 0}, "score": 4.967531803895328}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998912177632167, "4": 0.00010861000800155206, "3": 4.192908911266777e-08, "1": 0, "2": 0}, "score": 4.9998913061196575}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.998748886795521, "4": 0.0012508286841505358, "3": 2.2172964777807415e-07, "1": 0, "2": 0}, "score": 4.998748727777985}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9631229609776917, "4": 0.036843557721978504, "3": 3.3212541411972756e-05, "2": 1.9698445893009864e-07, "1": 1.8081744478395464e-08}, "score": 4.963089351933011}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8633054593025734, "5": 0.12830787880626396, "3": 0.00834794064398746, "2": 3.805797130749319e-05, "1": 4.2790698061370446e-07}, "score": 4.119882566715345}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8629278544023897, "4": 0.1369139298301958, "3": 0.00015792205017482391, "2": 2.7343114549420334e-07, "1": 0}, "score": 4.8627694029921456}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994279501329514, "4": 0.0005718451042627383, "3": 1.803524220440579e-07, "1": 0, "2": 0}, "score": 4.999427794176925}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997096279661218, "4": 0.0002902160245650311, "3": 5.91548059270069e-08, "1": 0, "2": 0}, "score": 4.9997096656377025}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7029114607375473, "4": 0.29683718177885815, "3": 0.00025072495912932145, "2": 5.415968128820417e-07, "1": 2.6584965173409844e-08}, "score": 4.702659618040905}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9604180505371175, "5": 0.034999108123608985, "3": 0.0045762060386020315, "2": 6.3411272857328105e-06, "1": 0}, "score": 4.030410228776316}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7429383292979792, "4": 0.2568015940052609, "3": 0.0002595134568143876, "2": 5.548533457554976e-07, "1": 2.0316631512509544e-08}, "score": 4.742677636324411}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9920406740215222, "4": 0.00795845494781002, "3": 8.12013395499694e-07, "1": 0, "2": 0}, "score": 4.992039920555617}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9461951107938833, "4": 0.053791651523423856, "3": 1.3076863948121622e-05, "2": 3.558431094567669e-08, "1": 0}, "score": 4.946182081255891}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8986740228388608, "3": 0.07838310282860508, "5": 0.02240989671634205, "2": 0.0005308083100077507, "1": 1.9676787685894594e-06}, "score": 3.9429592627304393}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999486537207161, "4": 0.0005133772515072838, "3": 6.207012764838041e-08, "1": 0, "2": 0}, "score": 4.999486498596186}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.59629799813665, "5": 0.4034977368846525, "3": 0.0002040974463470794, "2": 1.2316018645084733e-07, "1": 0}, "score": 4.403293411012933}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986608928052768, "4": 0.0013389563657446577, "3": 1.5410063098228631e-07, "1": 0, "2": 0}, "score": 4.998660735437374}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.998785501401099, "4": 0.0012142817855206448, "3": 1.2362710745377484e-07, "1": 0, "2": 0}, "score": 4.998785470847087}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7497547694395957, "5": 0.2459409776719366, "3": 0.004291561612675227, "2": 1.2278743025148065e-05, "1": 1.5881624418635955e-07}, "score": 4.241624443428592}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.669247923040509, "5": 0.32673572998823613, "3": 0.004003160919718099, "2": 1.291593161084251e-05, "1": 1.4560927518778218e-07}, "score": 4.322706340557847}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9043503485172156, "4": 0.09554589223096957, "3": 0.00010322081804689564, "2": 3.29566560121549e-07, "1": 0}, "score": 4.904246657433522}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8526696642313728, "4": 0.14720837189764346, "3": 0.0001207229870728402, "2": 1.1061810170914893e-06, "1": 9.435524271584494e-08}, "score": 4.8525464802147855}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9877443211360014, "4": 0.012253663812184205, "3": 1.9355829707188536e-06, "2": 9.806896247747594e-09, "1": 0}, "score": 4.9877424347473}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.958606602146918, "4": 0.04136698417524015, "3": 2.6184916999778037e-05, "2": 1.1370084549793772e-07, "1": 0}, "score": 4.958580300122473}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5037413938680918, "5": 0.495750025571892, "3": 0.0005070682236569497, "2": 1.3687563556433223e-06, "1": 5.683110715223698e-08}, "score": 4.495240092303735}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7421648727692421, "4": 0.2574351333328077, "3": 0.0003986702196483925, "2": 1.2438141150665545e-06, "1": 7.062893021261352e-08}, "score": 4.741763509884949}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999266180325883, "4": 7.324636030284378e-05, "3": 2.2816337513070983e-08, "1": 0, "2": 0}, "score": 4.999926707998757}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998273446066582, "4": 0.00017256199409475658, "3": 3.7353844460322115e-08, "1": 0, "2": 0}, "score": 4.99982736328854}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6341057629020949, "5": 0.36504311831750474, "3": 0.000849824840258014, "2": 1.01090862785239e-06, "1": 0}, "score": 4.3641913747376275}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7579698271520863, "5": 0.19700544717340476, "3": 0.04337866277065938, "2": 0.0016427978247401775, "1": 2.8250061962653797e-06}, "score": 4.150332779892061}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9499118007626924, "4": 0.049943795291085766, "3": 0.0001434191637935398, "2": 8.192807628968737e-07, "1": 4.571798827372568e-08}, "score": 4.949766719649959}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9980385593438138, "4": 0.001961111254152698, "3": 3.5598686601188325e-07, "1": 0, "2": 0}, "score": 4.998038176824269}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7585072666116155, "5": 0.23453845906535176, "3": 0.006525116966719658, "2": 0.00042458671391981765, "1": 4.050057416632587e-06}, "score": 4.227152136750532}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8320571421920804, "4": 0.1287230991383875, "2": 0.039119821371270985, "5": 8.685278491397068e-05, "1": 1.3108207463631744e-05}, "score": 3.0897507647954527}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9942430849102423, "4": 0.005756163990528611, "3": 7.903886898622011e-07, "1": 0, "2": 0}, "score": 4.9942422554583095}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982005400728904, "4": 0.0017988827522216321, "3": 5.334646654403397e-07, "1": 0, "2": 0}, "score": 4.998200050239771}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5260986690977755, "5": 0.4729628191632694, "3": 0.0009329807403888835, "2": 5.182246025561896e-06, "1": 9.121632077596566e-08}, "score": 4.472019321843939}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9895927342883316, "4": 0.010402410716840567, "3": 4.76182766586032e-06, "2": 3.164885075734008e-08, "1": 0}, "score": 4.989587970040746}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"3": 0.675966121715828, "2": 0.2698224577938749, "4": 0.053933309765866286, "1": 0.00020665764970598385, "5": 7.149993624092675e-05}, "score": 2.783840546674621}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6412038524993825, "4": 0.3561330079752115, "3": 0.0026121845902096863, "2": 4.969764551139856e-05, "1": 1.176960253011719e-06}, "score": 4.638488793026832}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.999689611440499, "4": 0.00031025283379907455, "3": 6.035946901823807e-08, "1": 0, "2": 0}, "score": 4.999689626423871}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998442687373722, "4": 0.00015558038726798488, "3": 2.574740478408249e-08, "1": 0, "2": 0}, "score": 4.999844368098449}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989371481275889, "4": 0.0010626398949474423, "3": 1.6790810520931273e-07, "1": 0, "2": 0}, "score": 4.998937024241997}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9145270249270945, "5": 0.08072268825782035, "3": 0.004738574153622709, "2": 1.1534165661391013e-05, "1": 0}, "score": 4.075961059331605}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9754751610806954, "4": 0.024505835649956457, "3": 1.8906836154509935e-05, "2": 3.7977954131839444e-08, "1": 0}, "score": 4.975456235309161}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.975594395818843, "4": 0.024396107209626802, "3": 9.438117642194995e-06, "2": 4.1789864620953814e-08, "1": 0}, "score": 4.975584890768874}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9976055772144212, "4": 0.0023942376685968814, "3": 2.322854113607107e-07, "1": 0, "2": 0}, "score": 4.997605297873535}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6919542488006858, "4": 0.30731297135934066, "3": 0.0007255618048142466, "2": 6.6731136024046155e-06, "1": 1.7073588613145354e-07}, "score": 4.69121508720379}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9766074381602059, "3": 0.02134985352471766, "5": 0.0020316703332533717, "2": 1.1042898569398588e-05, "1": 3.280768664758548e-08}, "score": 3.980659633317942}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9987730258490731, "4": 0.0012268026078411925, "3": 1.128123520373892e-07, "1": 0, "2": 0}, "score": 4.998772971695391}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9015149346781028, "4": 0.09847297834132812, "3": 1.2047179401399435e-05, "2": 2.5120238524234338e-08, "1": 0}, "score": 4.901502850493124}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992411649910219, "4": 0.0007587169310499926, "3": 3.4962387365632386e-08, "1": 0, "2": 0}, "score": 4.999241213081109}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969418897741832, "4": 0.003057846710813478, "3": 2.570361758230071e-07, "1": 0, "2": 0}, "score": 4.996941639197021}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5852815883231006, "4": 0.4142351670813764, "3": 0.0004817804719738514, "2": 1.3273408208290157e-06, "1": 0}, "score": 4.584797233159646}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5653289527509998, "3": 0.43173817105626766, "2": 0.002129216941399946, "5": 0.0008030919841140768, "1": 5.274604240016704e-07}, "score": 3.564804887340052}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5561577844549397, "4": 0.44364281989375826, "3": 0.00019918629806376856, "2": 1.7908505076719296e-07, "1": 0}, "score": 4.555958256814622}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998910985741908, "4": 0.00010883506357026716, "3": 3.098405870649265e-08, "1": 0, "2": 0}, "score": 4.999891102964459}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995658489408572, "4": 0.000434052397319659, "3": 5.628718205075047e-08, "1": 0, "2": 0}, "score": 4.999565835009919}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.881466527563149, "4": 0.11836516669840332, "3": 0.00016730032623054938, "2": 7.520169299639928e-07, "1": 0}, "score": 4.881297946519805}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9946347222924884, "4": 0.0053637442160491084, "3": 1.512758125673704e-06, "1": 0, "2": 0}, "score": 4.9946332301564285}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9248245917429683, "4": 0.07511728401654932, "3": 5.78001608163512e-05, "2": 2.1835623551322407e-07, "1": 0}, "score": 4.924766452639162}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9960275830058805, "4": 0.0039712117665003, "3": 1.1742545937211404e-06, "2": 6.49042385127528e-09, "1": 0}, "score": 4.996026420155757}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9204331173433715, "4": 0.0795421666356828, "3": 2.447241483121862e-05, "2": 1.509086726491579e-07, "1": 0}, "score": 4.920408428430701}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5072768343748757, "5": 0.4921011274566232, "3": 0.0006190948908606209, "2": 2.645146782142488e-06, "1": 0}, "score": 4.491476888796625}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8239502970549551, "4": 0.17574227565695727, "3": 0.00030521045588977297, "2": 1.8147188605753204e-06, "1": 0}, "score": 4.823641788358692}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8792012360617532, "4": 0.1206794285442963, "3": 0.00011855886140460724, "2": 4.595858863473533e-07, "1": 0}, "score": 4.879082036650691}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998779876841082, "4": 0.00012186599726128967, "3": 1.4354031405704017e-08, "1": 0, "2": 0}, "score": 4.99987810527859}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9948778398310891, "4": 0.005119456489295366, "3": 2.6311540650996628e-06, "2": 2.8753078418762492e-08, "1": 0}, "score": 4.994875194719013}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9470260672876275, "3": 0.037994285961370014, "5": 0.01479467441194042, "2": 0.00018411463095776843, "1": 7.515951667819175e-07}, "score": 3.9764299019020624}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997448916456715, "4": 0.0002549943933271289, "3": 2.122937502413866e-08, "1": 0, "2": 0}, "score": 4.999744963124273}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5247276042955864, "4": 0.47501309828065186, "3": 0.00025891570825195044, "2": 3.401728384905205e-07, "1": 1.1917749422174777e-08}, "score": 4.524467988025732}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987613729325278, "4": 0.001238350533259498, "3": 2.0775756290471105e-07, "1": 0, "2": 0}, "score": 4.998761233866416}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9911363736107498, "4": 0.008859673199302372, "3": 3.882528272171197e-06, "2": 2.4853680169914957e-08, "1": 0}, "score": 4.99113248677691}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9557599880273558, "5": 0.042258794203926704, "3": 0.0019785559866812344, "2": 2.6365350076158392e-06, "1": 1.7023518632558543e-08}, "score": 4.040274914407875}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7376745801014537, "5": 0.26180220580685165, "3": 0.0005226070576967749, "2": 5.145207253378251e-07, "1": 8.731706594524598e-09}, "score": 4.261278565402912}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6586139684217883, "4": 0.3413274836301303, "3": 5.850765251847621e-05, "2": 4.341073830770978e-08, "1": 0}, "score": 4.658555371896278}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.996308533277624, "4": 0.003691224622397031, "3": 2.3690111954032332e-07, "1": 0, "2": 0}, "score": 4.996308301556171}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9959970684750629, "4": 0.004002576500887433, "3": 3.9394087593005545e-07, "1": 0, "2": 0}, "score": 4.995996635773159}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9921185864992049, "4": 0.007875646518917102, "3": 5.692961333248719e-06, "2": 6.113673034980522e-08, "1": 0}, "score": 4.992112784046608}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9990799115412029, "4": 0.0009199290596227079, "3": 1.0372548447233933e-07, "1": 0, "2": 0}, "score": 4.9990798634381814}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9828968718368278, "4": 0.017097910772235488, "3": 5.21976591993255e-06, "2": 5.033350355056783e-09, "1": 0}, "score": 4.982891634722618}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996252855030201, "4": 0.00037456372847182703, "3": 4.580603435633518e-08, "1": 0, "2": 0}, "score": 4.999625344620135}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7878520898332626, "4": 0.21203578953437524, "3": 0.00011199044531452495, "2": 1.2202608543833725e-07, "1": 0}, "score": 4.787739861764493}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9016180107728172, "5": 0.09566216583674846, "3": 0.002716735780625614, "2": 3.0413015278750584e-06, "1": 3.754761410134913e-08}, "score": 4.092939235624435}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9904888369729226, "4": 0.009507620918692807, "3": 3.494099043209665e-06, "2": 1.1444002995565227e-08, "1": 0}, "score": 4.990485356203306}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8297489946606176, "4": 0.1701812727062233, "3": 6.96780646941438e-05, "2": 7.347159264953831e-08, "1": 0}, "score": 4.829679153969207}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999624963432797, "4": 3.7402088980875584e-05, "3": 2.2482198919520845e-08, "1": 0, "2": 0}, "score": 4.999962552943661}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9970524400101042, "4": 0.0029467659444877546, "3": 8.33088464948556e-07, "1": 0, "2": 0}, "score": 4.997051567993699}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9176284948284423, "5": 0.06240884293158437, "3": 0.019905332864739958, "2": 5.70013275528536e-05, "1": 1.7016351657215843e-07}, "score": 4.042389003613742}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8316405772473037, "5": 0.15297458232275987, "3": 0.015348043075717823, "2": 3.608865528673523e-05, "1": 3.8927492300877903e-07}, "score": 4.137553238049508}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9292165752972378, "4": 0.07070613745620884, "3": 7.707250159209713e-05, "2": 1.7806040327090245e-07, "1": 0}, "score": 4.9291391807599}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9768042902963571, "4": 0.023187187866224212, "3": 8.318488419380118e-06, "2": 4.149985100322251e-08, "1": 0}, "score": 4.9767960469018435}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6099400715509947, "4": 0.38879599786730584, "3": 0.001260396405446613, "2": 3.371880356227394e-06, "1": 0}, "score": 4.608673030169971}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6015737746296926, "5": 0.39733016263589854, "3": 0.0010938627936354236, "2": 2.276564612930511e-06, "1": 5.2611347948794356e-08}, "score": 4.3962315376719365}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.542827494070724, "4": 0.4566159835108982, "3": 0.0005549081241464003, "2": 1.4452185531240014e-06, "1": 4.0406224179375284e-08}, "score": 4.542269644064338}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5312748783524964, "5": 0.46818893372062015, "3": 0.0005335517451924564, "2": 2.246938353863795e-06, "1": 7.333792262282078e-08}, "score": 4.467650815818378}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.997945113875249, "4": 0.002054301277088468, "3": 5.925005711330213e-07, "1": 0, "2": 0}, "score": 4.9979445137375}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9873600833424493, "4": 0.012630029587321935, "3": 9.772385069032811e-06, "2": 6.19746751914352e-08, "1": 0}, "score": 4.987350239051739}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7072952433811927, "4": 0.292601928356257, "3": 0.00010257677657705001, "2": 1.4918122423866846e-07, "1": 0}, "score": 4.707192440591311}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8434659882319552, "4": 0.15645973288001322, "3": 7.34277961418233e-05, "2": 6.973900291376475e-07, "1": 0}, "score": 4.843391295286566}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7389426987087343, "5": 0.26010668635375195, "3": 0.0009497393304701691, "2": 6.560748197559643e-07, "1": 0}, "score": 4.259155691766668}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989941326240803, "4": 0.0010057718724182294, "3": 9.640478496455397e-08, "1": 0, "2": 0}, "score": 4.998994035318919}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9420044240246276, "5": 0.03758894078157715, "3": 0.018557968749303544, "2": 0.001842049626264989, "1": 6.233248079194171e-06}, "score": 4.015328178914938}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7090767835045186, "3": 0.28889193157189386, "5": 0.0012212675306899653, "2": 0.0008093682927989796, "1": 6.368727282514525e-07}, "score": 3.7107086852177416}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.593913632513495, "5": 0.4053539552415491, "3": 0.0007298525722788865, "2": 2.3359754557729563e-06, "1": 0}, "score": 4.404619521230622}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9054445775431004, "5": 0.09349649780687264, "3": 0.0010575715391685416, "2": 1.3262820253695702e-06, "1": 0}, "score": 4.092436276183611}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.929759624986346, "5": 0.053423764709513634, "3": 0.0167793636799502, "2": 3.717834834013413e-05, "1": 8.697040052775398e-08}, "score": 4.036569782738026}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9026617088902029, "3": 0.08870225209201751, "5": 0.008263587200080257, "2": 0.00037197258598326786, "1": 4.7434686508221367e-07}, "score": 3.918815966498929}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9943043659770168, "4": 0.005693893466975715, "3": 1.7012198591879797e-06, "2": 1.559581855447873e-08, "1": 0}, "score": 4.994302657170594}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999241149394169, "4": 7.582215694864488e-05, "3": 2.301064274498593e-08, "1": 0, "2": 0}, "score": 4.99992413181874}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9859282014824267, "4": 0.01405158047788041, "3": 2.002672352598884e-05, "2": 9.641731840125531e-08, "1": 1.252659315575748e-08}, "score": 4.9859080255559505}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999288827389523, "4": 7.104038782833532e-05, "3": 7.556837910948795e-09, "1": 0, "2": 0}, "score": 4.99992894449357}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9941993670145013, "4": 0.005800457994374335, "3": 2.1039186947693145e-07, "1": 0, "2": 0}, "score": 4.9941991214272425}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9274605677125048, "5": 0.055674547132411795, "3": 0.016829205150987882, "2": 3.500316751994268e-05, "1": 3.3742215671744786e-07}, "score": 4.038774336540483}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9616919739388929, "3": 0.029838215730160805, "5": 0.008304110049975867, "2": 0.00016507560118503653, "1": 4.886540803234851e-07}, "score": 3.9781342741809036}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9854482491955391, "4": 0.014547952746098112, "3": 3.743082829920607e-06, "2": 1.4349740191882171e-08, "1": 0}, "score": 4.985444517447694}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7222599957461197, "4": 0.27759060349605286, "3": 0.00014922430221203564, "2": 1.002455661167177e-07, "1": 0}, "score": 4.722110625984862}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6438379725194018, "5": 0.3554898789662331, "3": 0.0006714500033150088, "2": 4.2986097263125823e-07, "1": 0}, "score": 4.354817664562765}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9508826285818706, "5": 0.04271451016335862, "3": 0.006393410681594294, "2": 9.249546820670979e-06, "1": 5.6977123031444163e-08}, "score": 4.0363024346860925}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5519779605731733, "4": 0.44791174667591466, "3": 0.00011006890270982158, "2": 1.3622566838650289e-07, "1": 0}, "score": 4.55186766757517}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.999345202033818, "4": 0.0006546608779449589, "3": 5.8150113856749534e-08, "1": 0, "2": 0}, "score": 4.999345222770141}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993023434755611, "4": 0.000697557716515278, "3": 6.352158929076036e-08, "1": 0, "2": 0}, "score": 4.999302315215687}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921443977921031, "4": 0.007852903052088984, "3": 2.6174971055746012e-06, "2": 2.2729095343136106e-08, "1": 0}, "score": 4.9921417933033325}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8035050088775839, "5": 0.1931537258742966, "3": 0.003331427793723847, "2": 9.609647655637122e-06, "1": 8.628880233988791e-08}, "score": 4.189802846779362}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9065103330595172, "4": 0.09329604147029923, "3": 0.0001926478783364475, "2": 8.22446008189597e-07, "1": 4.783276366156909e-08}, "score": 4.906315994050431}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7088241348320587, "4": 0.2903697988180951, "3": 0.0008046079643311499, "2": 1.4949885649705612e-06, "1": 5.254305017681561e-08}, "score": 4.708016316144554}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9906413701306567, "4": 0.009347531324581304, "3": 1.0980715061556945e-05, "2": 7.873909854482287e-08, "1": 1.5286328043001623e-08}, "score": 4.990630209659647}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6931106600003126, "3": 0.2950710807416198, "5": 0.009045480846200786, "2": 0.0027684934156877454, "1": 4.1705651656757325e-06}, "score": 3.7084248682124703}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9321674202198816, "5": 0.06495904399907598, "3": 0.0028693682367785796, "2": 4.018479342124583e-06, "1": 3.679348667366538e-08}, "score": 4.062081535393136}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6673690084421181, "4": 0.3325235813658431, "3": 0.00010727231033694313, "2": 9.545069552517476e-08, "1": 0}, "score": 4.667261573542971}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6078323349080389, "5": 0.39083403969870667, "3": 0.0013299578885421681, "2": 3.5032235466950852e-06, "1": 3.584398738020583e-08}, "score": 4.389497017857007}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6075104513786171, "4": 0.3923766534011137, "3": 0.00011261417072994749, "2": 1.6114633044436252e-07, "1": 0}, "score": 4.6073975877441455}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6786745324452289, "5": 0.31871633620267764, "3": 0.002604207168512159, "2": 4.758804865133306e-06, "1": 0}, "score": 4.316102663701089}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9775022708549951, "4": 0.022490753720245074, "3": 6.86121512491965e-06, "2": 3.032310117212763e-08, "1": 0}, "score": 4.977495430992371}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9338961512813221, "4": 0.06609276456946003, "3": 1.099266858107939e-05, "2": 1.6537720074333804e-08, "1": 0}, "score": 4.933885195525382}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9266463052117916, "4": 0.0733404999120029, "3": 1.309666421840243e-05, "2": 1.654564353976792e-08, "1": 0}, "score": 4.926633251131035}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999243533313535, "4": 7.558543137719189e-05, "3": 2.3137341717986664e-08, "1": 0, "2": 0}, "score": 4.999924368291058}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5155552003884531, "5": 0.4832120474672775, "3": 0.0012236109459922157, "2": 8.797226998022485e-06, "1": 2.3287313887617945e-07}, "score": 4.481970196993865}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"4": 0.823240152116554, "3": 0.1351470140639812, "5": 0.03899642514509801, "2": 0.002613096401733525, "1": 3.154779353234704e-06}, "score": 3.8986137379719352}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6751613700100075, "4": 0.322771059884239, "3": 0.002041249007298724, "2": 2.536632629304926e-05, "1": 7.275144322159572e-07}, "score": 4.673067358766587}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9637841348027976, "4": 0.03618976264527908, "3": 2.5682120719942187e-05, "2": 2.0507829579862013e-07, "1": 0}, "score": 4.963758250073627}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993029390599354, "4": 0.0006968602287172435, "3": 1.1019448355115855e-07, "1": 0, "2": 0}, "score": 4.999302919319218}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.98392174060323, "4": 0.01607297964187287, "3": 5.230273430958733e-06, "2": 5.92393393323572e-08, "1": 0}, "score": 4.9839163822501895}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9836085274949671, "4": 0.0163904668959007, "3": 9.446588310329236e-07, "1": 0, "2": 0}, "score": 4.983607642787319}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6852924277443484, "4": 0.31456105126861705, "3": 0.0001461904988655643, "2": 3.292639922116612e-07, "1": 0}, "score": 4.685145579556238}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.737901317092032, "4": 0.26205056438659247, "3": 4.787127118365815e-05, "2": 9.932157684727339e-08, "1": 0}, "score": 4.737853356327319}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970430800248475, "4": 0.0029565418131982458, "3": 3.6207715951569514e-07, "1": 0, "2": 0}, "score": 4.997042733984915}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9158944501878038, "5": 0.07223034720462142, "3": 0.011854959212524992, "2": 2.0193192809087914e-05, "1": 0}, "score": 4.060335004635431}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6239843194593527, "5": 0.3750808598458973, "3": 0.0009325703191624034, "2": 2.0690344681737033e-06, "1": 3.768506405140155e-08}, "score": 4.3741440921506705}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5128234987654393, "5": 0.486523438848338, "3": 0.0006523069660547143, "2": 8.153087182757973e-07, "1": 0}, "score": 4.485869472166828}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8821876416213894, "4": 0.11777396999099675, "3": 3.829004948890242e-05, "2": 5.089566927579358e-08, "1": 0}, "score": 4.882149291631892}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995420298203714, "4": 0.00045770233899242727, "3": 1.8941196216096392e-07, "1": 0, "2": 0}, "score": 4.999541918801158}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999441398352371, "4": 5.572748977575025e-05, "3": 1.5275570255244967e-08, "1": 0, "2": 0}, "score": 4.999944241952537}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"4": 0.94520635712408, "5": 0.049299787908577405, "3": 0.005485044896307109, "2": 8.523282682120477e-06, "1": 6.031861948683934e-08}, "score": 4.043797525409862}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9869272652696652, "4": 0.01307058491318003, "3": 2.095737579424469e-06, "2": 1.1613936936111202e-08, "1": 0}, "score": 4.986925188214619}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993647278708389, "4": 0.0006351962193207635, "3": 7.51200001537259e-08, "1": 0, "2": 0}, "score": 4.999364653540178}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995415532188544, "4": 0.0004583172170270558, "3": 4.949981028526593e-08, "1": 0, "2": 0}, "score": 4.999541583746649}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995313064511533, "4": 0.00046856941636200423, "3": 6.544419776065209e-08, "1": 0, "2": 0}, "score": 4.999531299667735}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9463467970812037, "4": 0.05361731081930415, "3": 3.576395554863742e-05, "2": 8.126706557055239e-08, "1": 0}, "score": 4.946310914951626}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.989773367279527, "4": 0.010223370030300443, "3": 3.230744344709889e-06, "2": 4.200875000092963e-09, "1": 0}, "score": 4.989770155594559}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9984230618756138, "4": 0.0015763287682604944, "3": 5.811679798135448e-07, "1": 0, "2": 0}, "score": 4.998422508851312}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999520068687072, "4": 4.796149770891087e-05, "3": 1.4866031376856531e-08, "1": 0, "2": 0}, "score": 4.999952008769424}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9993850879359619, "4": 0.0006148138616214009, "3": 8.954934704315476e-08, "1": 0, "2": 0}, "score": 4.999385007034363}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9365782638573674, "5": 0.06033118166689506, "3": 0.0030862485102825603, "2": 4.21448566022555e-06, "1": 0}, "score": 4.057236509421276}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9705131837236126, "4": 0.029473727667129634, "3": 1.2958806011843952e-05, "2": 3.104109081540487e-08, "1": 0}, "score": 4.970500258684115}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8392991253603488, "4": 0.160641067051334, "3": 5.969770383683163e-05, "2": 9.193086589925191e-08, "1": 0}, "score": 4.8392392588621576}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997190387070186, "4": 0.00028084911223057423, "3": 9.310331932213261e-08, "1": 0, "2": 0}, "score": 4.99971896467577}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998178099986144, "4": 0.00018201617522026374, "3": 1.4272887290913488e-07, "1": 0, "2": 0}, "score": 4.9998176983613645}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"4": 0.978861485657955, "3": 0.012383942564810131, "5": 0.0087476446299326, "2": 7.003986997370915e-06, "1": 4.6810888538740674e-08}, "score": 3.9963495541098424}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9938657836018145, "4": 0.0061321160061050895, "3": 2.079277667095462e-06, "1": 0, "2": 0}, "score": 4.993863725308997}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6949990641256849, "5": 0.3045250588939574, "3": 0.0004756781918079435, "2": 2.3049192676587316e-07, "1": 0}, "score": 4.304048910078919}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971004339852668, "4": 0.0028992844900526922, "3": 2.8468913681324716e-07, "1": 0, "2": 0}, "score": 4.99710014614085}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997058145610249, "4": 0.00029414315128344873, "3": 2.5568543769707877e-08, "1": 0, "2": 0}, "score": 4.999705805706712}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8038980189100466, "4": 0.19573474072955496, "3": 0.00036426971115311265, "2": 2.694321898285437e-06, "1": 9.53267855686282e-08}, "score": 4.803528220013799}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8276729007930731, "4": 0.17220950346165215, "3": 0.00011716574519917515, "2": 3.4055676994897183e-07, "1": 0}, "score": 4.827555127953602}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9390597408679979, "3": 0.04627581076928473, "5": 0.01451031649682016, "2": 0.00015363145086117952, "1": 5.11369201396727e-07}, "score": 3.967925709069556}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996425527394996, "4": 0.00035735459708656167, "3": 4.8345485048345265e-08, "1": 0, "2": 0}, "score": 4.9996425486961025}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9985057794608039, "4": 0.0014935103355159245, "3": 7.282597885518608e-07, "1": 0, "2": 0}, "score": 4.9985050331719}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6308510930169478, "4": 0.3688118524265802, "3": 0.0003362623160705149, "2": 7.801590716831438e-07, "1": 2.5916551974142118e-08}, "score": 4.6305131839097875}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999155329675407, "4": 8.436491009344624e-05, "3": 1.3529112390269313e-08, "1": 0, "2": 0}, "score": 4.999915608024206}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9970904754944127, "4": 0.002909026761378627, "3": 4.853221207378858e-07, "1": 0, "2": 0}, "score": 4.997090002558233}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9943020134556699, "4": 0.005697844121412986, "3": 1.0173921635593726e-07, "1": 0, "2": 0}, "score": 4.994301952168336}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999996945503965, "4": 3.00774478767235e-06, "3": 2.043889963414485e-09, "1": 0, "2": 0}, "score": 4.9999969881672985}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9937832447864564, "4": 0.006211533332927374, "3": 5.124031635313883e-06, "2": 4.2468848765227206e-08, "1": 0}, "score": 4.993778090852685}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9991322665985597, "4": 0.0008668005966204397, "3": 8.585198801789015e-07, "1": 0, "2": 0}, "score": 4.999131482299101}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.984974434469678, "4": 0.01499563680290496, "3": 2.9701262637860433e-05, "2": 1.8436561736776663e-07, "1": 3.242788941490229e-08}, "score": 4.984944277702746}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989402440383959, "4": 0.0010596129277989775, "3": 1.524195379712407e-07, "1": 0, "2": 0}, "score": 4.998940082243073}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5892114862087036, "4": 0.41041115692718744, "3": 0.00037638688278381505, "2": 9.533440315099539e-07, "1": 0}, "score": 4.588833202434448}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5895321634106713, "5": 0.40866321391955734, "3": 0.0017951009842307112, "2": 9.197563002791696e-06, "1": 1.4812386315343294e-07}, "score": 4.4068493450426764}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9664719915584103, "4": 0.03351152062557572, "3": 1.6437898581764537e-05, "2": 4.7497773532708434e-08, "1": 4.9534179683190965e-09}, "score": 4.966455441355262}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9864421553281681, "4": 0.0135489218918368, "3": 8.800403370269465e-06, "2": 3.9217843593793655e-08, "1": 0}, "score": 4.986433358519706}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999839382170425, "4": 0.00016051069212689588, "3": 3.1965999968032344e-08, "1": 0, "2": 0}, "score": 4.9998394253638025}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995284469161198, "4": 0.0004712145723807227, "3": 2.9965950206480497e-07, "1": 0, "2": 0}, "score": 4.999528186090284}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7289819552669979, "5": 0.27009838431621386, "3": 0.0009172464178970621, "2": 2.1777768392951847e-06, "1": 6.954811651253141e-08}, "score": 4.269176618565015}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5310469731375834, "4": 0.4686490897839997, "3": 0.0003034016659890962, "2": 5.555801243579106e-07, "1": 0}, "score": 4.530742449607493}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9420043119261078, "5": 0.05562876808144579, "3": 0.0023651212260022555, "2": 1.6099346014666108e-06, "1": 1.8775180978658647e-08}, "score": 4.05326037971798}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995489331912348, "4": 0.0004509620808203537, "3": 8.467105747497624e-08, "1": 0, "2": 0}, "score": 4.9995488685680165}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8095840837839119, "3": 0.183453380680926, "5": 0.0037705967534838454, "2": 0.0031871441944459986, "1": 4.558558968779356e-06}, "score": 3.8139292080887937}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9605796093214272, "4": 0.039358453449957254, "3": 6.107762266691954e-05, "2": 5.925070886751505e-07, "1": 0}, "score": 4.96051760323774}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9553079688651452, "5": 0.034975551155452624, "3": 0.009615130764325698, "2": 0.00010070128476293915, "1": 4.958650618283372e-07}, "score": 4.025157534052003}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9370947980339842, "4": 0.06286544061836817, "3": 3.9462172623621455e-05, "2": 1.6738622001355916e-07, "1": 0}, "score": 4.937055124582295}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994470010203297, "4": 0.0005526835293018407, "3": 2.4614476462786955e-07, "1": 0, "2": 0}, "score": 4.99944682414283}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998236499315017, "4": 0.00017620296801923598, "3": 1.144379594116027e-07, "1": 0, "2": 0}, "score": 4.9998235681502985}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5112353946269723, "5": 0.488364170700838, "3": 0.0003990515306159779, "2": 9.593316431498962e-07, "1": 0}, "score": 4.487963407310674}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999897933310884, "4": 1.0095437185550034e-05, "3": 3.130415793009091e-09, "1": 0, "2": 0}, "score": 4.999989898300891}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5784505590763827, "5": 0.4212159885172897, "3": 0.000332896808630596, "2": 3.2604187920873487e-07, "1": 0}, "score": 4.420882536240936}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999711292653989, "4": 0.00028858150468750554, "3": 4.624761231232907e-08, "1": 0, "2": 0}, "score": 4.9997113259771115}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5601264876244247, "4": 0.43920579255336795, "3": 0.0006625926240431064, "2": 4.5582581138157385e-06, "1": 1.5608579701742494e-07}, "score": 4.559454541199949}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6729735040656611, "5": 0.3257889499682579, "3": 0.00123612227110147, "2": 1.28211307670173e-06, "1": 0}, "score": 4.324550309421454}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9975899169249881, "4": 0.002409850419507939, "3": 2.2456155056807694e-07, "1": 0, "2": 0}, "score": 4.997589700437882}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9947782705750939, "4": 0.005220965147611307, "3": 7.402669296849663e-07, "1": 0, "2": 0}, "score": 4.994777554193138}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9346309626106701, "4": 0.06535944630055562, "3": 9.4576842380485e-06, "2": 3.137673946235581e-08, "1": 0}, "score": 4.9346215375303295}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998782260650476, "4": 0.00012169690374443307, "3": 3.662495493696392e-08, "1": 0, "2": 0}, "score": 4.999878229841425}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.629920744431524, "3": 0.36682448053530586, "2": 0.002033461023500199, "5": 0.0012199968526931653, "1": 1.2436089026680559e-06}, "score": 3.6303248362547826}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.928791477926142, "5": 0.0659551706707379, "3": 0.005245278187144241, "2": 8.058710514813276e-06, "1": 0}, "score": 4.060693775942956}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7721172749018248, "4": 0.22756540213364618, "3": 0.00031605667790552604, "2": 1.160576144332577e-06, "1": 2.6131613771055602e-08}, "score": 4.771798880095669}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941798040477705, "4": 0.0058162090235313445, "3": 3.92048965489399e-06, "2": 5.2852860564117006e-08, "1": 0}, "score": 4.9941757913594484}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8652757385131108, "3": 0.10887110711435388, "5": 0.024633831909559194, "2": 0.0012190342891030281, "1": 2.3221945167060386e-07}, "score": 3.9133239547087357}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7982205909261257, "3": 0.19362975940845178, "2": 0.00618517487182866, "5": 0.001947365783352368, "1": 1.7000768653813762e-05}, "score": 3.795896232232766}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9786107138958421, "4": 0.021387562874291232, "3": 1.7315441072412355e-06, "1": 0, "2": 0}, "score": 4.978608974215343}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.794877431839975, "4": 0.20503737487457782, "3": 8.497087561601324e-05, "2": 1.7811721360031153e-07, "1": 0}, "score": 4.794792139933356}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999870516788303, "4": 1.2922778868959368e-05, "3": 9.678586200424081e-09, "1": 0, "2": 0}, "score": 4.999987057863753}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999905085465441, "4": 9.393035946627935e-06, "3": 5.576357787088457e-09, "1": 0, "2": 0}, "score": 4.999990595810465}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7835235658296743, "3": 0.2156965759162993, "5": 0.0005621251758739888, "2": 0.0002175669366651555, "1": 1.4336944597469253e-07}, "score": 3.784429980368937}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9937792460094812, "4": 0.006220434620460897, "3": 2.9944861601595017e-07, "1": 0, "2": 0}, "score": 4.993778966358375}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6060830840001542, "5": 0.3919597982247349, "3": 0.0019525911375059333, "2": 4.491800205171004e-06, "1": 4.0432415897843725e-08}, "score": 4.389998100007526}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9916780497469269, "4": 0.00832101197445886, "3": 8.359583881840349e-07, "1": 0, "2": 0}, "score": 4.991677315257186}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9937268518706176, "4": 0.006272194409511177, "3": 8.904908583668901e-07, "1": 0, "2": 0}, "score": 4.993726024212075}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8774662200961627, "5": 0.11880901394191562, "3": 0.0037190166017988554, "2": 5.485978963692792e-06, "1": 0}, "score": 4.115079055691845}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9981736892387826, "4": 0.0018262236928744437, "3": 4.6853786957118274e-08, "1": 0, "2": 0}, "score": 4.998173682526106}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8459437592615034, "5": 0.15298083911112734, "3": 0.0010728442281610412, "2": 2.40170897763549e-06, "1": 0}, "score": 4.151903215114857}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9973707319958455, "4": 0.0026285253328290664, "3": 7.316167687785416e-07, "2": 5.4999215964527545e-09, "1": 0}, "score": 4.99736999491926}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951458621917281, "4": 0.004849476102356597, "3": 4.6458370379782765e-06, "2": 2.465825756648546e-08, "1": 0}, "score": 4.9951411582915}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9355287327034426, "5": 0.06259623164826975, "3": 0.0018720696414302057, "2": 2.9081861129914427e-06, "1": 0}, "score": 4.060718349145394}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7500936601865026, "4": 0.24981775673748524, "3": 8.831434553147681e-05, "2": 1.6342657991026388e-07, "1": 0}, "score": 4.750005097966274}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9035794472990005, "4": 0.09622236152861505, "3": 0.00019740778382593076, "2": 6.279508109868186e-07, "1": 0}, "score": 4.903380924033049}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990482586933288, "4": 0.0009515204300928375, "3": 1.930524351936507e-07, "1": 0, "2": 0}, "score": 4.999048093438551}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7396433118515433, "3": 0.24126282006720207, "2": 0.01076401556601978, "5": 0.008293580476518448, "1": 3.597576646240532e-05}, "score": 3.7453947265454115}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9611320024264425, "5": 0.022368713839825038, "3": 0.016454414156265428, "2": 4.449053891714391e-05, "1": 2.3289642735447155e-07}, "score": 4.005824620767664}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9979477271975404, "4": 0.002051730490934425, "3": 5.647436079688131e-07, "1": 0, "2": 0}, "score": 4.997947140067899}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5105592936163258, "4": 0.48928739123763837, "3": 0.00015316037238681217, "2": 1.021352419931719e-07, "1": 0}, "score": 4.510405955840411}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987715971052815, "4": 0.0012282596871421843, "3": 6.489910524520806e-08, "1": 0, "2": 0}, "score": 4.998771610418454}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992003392991701, "4": 0.0007995487915281201, "3": 7.644433561433401e-08, "1": 0, "2": 0}, "score": 4.99920029829144}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5519795944303547, "3": 0.36671430301084573, "2": 0.06691075917770659, "5": 0.013852106002031638, "1": 0.0005430285288998936}, "score": 3.511687097064845}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8665296433216853, "4": 0.13338483935133616, "3": 8.522003493104669e-05, "2": 2.687839338465011e-07, "1": 0}, "score": 4.866443910419568}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9536701500360252, "4": 0.04631752406380512, "3": 1.2267329102431396e-05, "2": 4.4393711962671286e-08, "1": 0}, "score": 4.9536578074398445}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9294815884796332, "4": 0.07051120116579229, "3": 7.1588085104091005e-06, "2": 3.370505536526064e-08, "1": 0}, "score": 4.929474378843772}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9686306072875773, "5": 0.02358174696243334, "3": 0.007766163457946086, "2": 2.114352174213233e-05, "1": 6.531089299181474e-08}, "score": 4.015773104841627}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5494247814222202, "5": 0.4499799287456275, "3": 0.0005939339737992182, "2": 1.2901178334533423e-06, "1": 3.722594025493385e-08}, "score": 4.449383315672318}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9976010656531604, "4": 0.0023980149213060236, "3": 8.39384459531644e-07, "1": 0, "2": 0}, "score": 4.997600306117701}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.978195432674427, "5": 0.018872172431926015, "3": 0.0029303637995262335, "2": 2.0071896466767386e-06, "1": 0}, "score": 4.015937794634091}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8629939917275011, "4": 0.1366259744792977, "3": 0.0003777088867230067, "2": 2.3087622489508416e-06, "1": 4.2523711455229706e-08}, "score": 4.862611514989902}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997091664126677, "4": 0.0029081096898246907, "3": 1.7072991048001337e-07, "1": 0, "2": 0}, "score": 4.997091548689071}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7397602734987574, "5": 0.25850857847353703, "3": 0.0017277147456084435, "2": 3.285942621516427e-06, "1": 7.765374960338906e-08}, "score": 4.256774076774926}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.671510873700193, "5": 0.32774801919587265, "3": 0.0007403790301439187, "2": 7.213300769882141e-07, "1": 1.8056989449526705e-08}, "score": 4.327006139635096}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8475565468554576, "5": 0.1517907881478462, "3": 0.0006520134287548179, "2": 6.175968121026852e-07, "1": 0}, "score": 4.15113754465978}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993511583888156, "4": 0.0006482978643628464, "3": 4.419818584242853e-07, "1": 0, "2": 0}, "score": 4.999350818105857}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.907932620165953, "4": 0.09201216338183847, "3": 5.503118683889836e-05, "2": 1.616282325087905e-07, "1": 1.59739430759731e-08}, "score": 4.907877224758059}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9349609829774777, "5": 0.043406533835591295, "3": 0.02158601128039286, "2": 4.6167798733610035e-05, "1": 2.3754803055558146e-07}, "score": 4.021727475759815}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8628966083504951, "3": 0.13439823277164978, "2": 0.0016427740043444172, "5": 0.0010610837367348391, "1": 1.305449672387936e-06}, "score": 3.863373387196636}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9996370713145544, "4": 0.00036274008479955227, "3": 1.3506374294259292e-07, "1": 0, "2": 0}, "score": 4.9996369897682795}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963180013422345, "4": 0.0036815073672613534, "3": 5.03136163850565e-07, "1": 0, "2": 0}, "score": 4.996317486404033}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9914439897861758, "4": 0.00855481497136386, "3": 1.1768890490703527e-06, "2": 4.651895807019888e-09, "1": 0}, "score": 4.991442817177604}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9851497976897746, "4": 0.014844448826759796, "3": 5.67072830284425e-06, "2": 2.7058896358860633e-08, "1": 0}, "score": 4.9851441277125295}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9978454020855745, "4": 0.0021542147650399483, "3": 3.9140265447770913e-07, "1": 0, "2": 0}, "score": 4.997845002447437}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8913980464720148, "5": 0.09596152011542136, "3": 0.01261787272329887, "2": 2.209451876247665e-05, "1": 1.640676490446256e-07}, "score": 4.083298991316514}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9633389751536848, "4": 0.03664470264917686, "3": 1.62215005698803e-05, "2": 6.459363244363976e-08, "1": 0}, "score": 4.963322659244627}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5571698992400911, "5": 0.44251144077926, "3": 0.0003183325394592661, "2": 2.486205495957136e-07, "1": 0}, "score": 4.442192645852609}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"5": 0.813461792692058, "4": 0.1864583479928982, "3": 7.975700365738387e-05, "2": 1.0095691452312748e-07, "1": 0}, "score": 4.813381834876275}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998964621704111, "4": 0.000103388378068209, "3": 2.191656704592622e-08, "1": 0, "2": 0}, "score": 4.999896567775607}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9820092943083566, "4": 0.017986226651823853, "3": 4.53268082460055e-06, "2": 1.1112524848760013e-08, "1": 0}, "score": 4.982004675814213}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996990219729768, "4": 0.0003008541386106929, "3": 9.116798893502382e-08, "1": 0, "2": 0}, "score": 4.999698963515562}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990562267343958, "4": 0.0009433275375065158, "3": 3.571410625564486e-07, "2": 2.469411435311411e-09, "1": 0}, "score": 4.999055950690835}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8481815365338624, "5": 0.14455592819219276, "3": 0.0072404856217976364, "2": 2.1475227423471904e-05, "1": 3.02221090399879e-07}, "score": 4.137271622818112}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9079154113741585, "5": 0.04669553636148362, "3": 0.045336537693353975, "2": 5.233804570601749e-05, "1": 1.6234680797022362e-07}, "score": 4.001253835554071}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6986262165812372, "5": 0.29672333687277674, "3": 0.0046359803132892735, "2": 1.3662386662676953e-05, "1": 2.2116827496162724e-07}, "score": 4.292059538457935}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7912414589167664, "4": 0.20854936566260132, "3": 0.0002083773373332535, "2": 5.370135553600469e-07, "1": 0}, "score": 4.7910322140669}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9284243007998245, "4": 0.07151228684926554, "3": 6.299356371788072e-05, "2": 1.5341901480363273e-07, "1": 0}, "score": 4.928361246755609}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5365897408376359, "5": 0.4628181345543453, "3": 0.0005913928739957762, "2": 6.917411583012646e-07, "1": 2.6774309765799296e-08}, "score": 4.462225283985053}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999591694239494, "4": 0.00040816828718957625, "3": 1.0178836826666798e-07, "1": 0, "2": 0}, "score": 4.9995916281215}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9085281377217868, "4": 0.0914421268730109, "3": 2.9695322979318528e-05, "2": 3.348239696336543e-08, "1": 0}, "score": 4.908498381429945}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9902369876856745, "4": 0.0097614922087781, "3": 1.491850891275968e-06, "1": 0, "2": 0}, "score": 4.990235523813547}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998063722682694, "4": 0.00019351336076441856, "3": 7.623097201082805e-08, "1": 0, "2": 0}, "score": 4.9998063341699055}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8644782700790299, "4": 0.13529252404341824, "3": 0.0002278222131664329, "2": 1.251321956848089e-06, "1": 6.735336314493115e-08}, "score": 4.864247799328517}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8293204653239808, "5": 0.1690577510911561, "3": 0.0016179813289472936, "2": 3.6941835083935726e-06, "1": 8.992201879869053e-08}, "score": 4.167432114668093}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5483163377039038, "4": 0.4510473301885951, "3": 0.0006347819524558236, "2": 1.3800028411402462e-06, "1": 6.82989120149138e-08}, "score": 4.547678646631904}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99900888827599, "4": 0.0009908547534666925, "3": 2.079643845565097e-07, "1": 0, "2": 0}, "score": 4.999008729269186}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9494272537393237, "5": 0.046758790913240006, "3": 0.0037959977156986823, "2": 1.7528735414430476e-05, "1": 2.9789463106435687e-07}, "score": 4.042926847666309}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9271173873387294, "5": 0.056085419623087225, "3": 0.016721984302301283, "2": 7.434835577225161e-05, "1": 6.090009556657868e-07}, "score": 4.039212921463686}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9992779386618437, "4": 0.0007216653721391254, "3": 2.992950382719935e-07, "1": 0, "2": 0}, "score": 4.999277735967962}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9429583498816264, "4": 0.057006613018997, "3": 3.4811805159069546e-05, "2": 1.748762947724322e-07, "1": 0}, "score": 4.942923235864109}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999748931371826, "4": 2.5059889949160235e-05, "3": 2.3961343323887415e-08, "1": 0, "2": 0}, "score": 4.999974892186787}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999918197754583, "4": 8.132859290392011e-06, "3": 2.866053043101723e-09, "1": 0, "2": 0}, "score": 4.999991861408242}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9303137352437475, "5": 0.06582855949094084, "3": 0.003853956484692982, "2": 3.6626962552702257e-06, "1": 3.921298088268236e-08}, "score": 4.061967162879282}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994953359297604, "4": 0.005046301400340509, "3": 3.7250625772729364e-07, "1": 0, "2": 0}, "score": 4.994952953754728}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5696293743939337, "5": 0.42919958291462745, "3": 0.0011685632222171668, "2": 2.160659627038217e-06, "1": 0}, "score": 4.428026834832219}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994770095372134, "4": 0.0005229119310252452, "3": 4.769649127184015e-08, "1": 0, "2": 0}, "score": 4.999476992659865}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.98792823649386, "4": 0.012069942593679972, "3": 1.6881792106148707e-06, "1": 0, "2": 0}, "score": 4.987926679445367}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9998781068795701, "4": 0.00012178833244632567, "3": 3.1822157915817666e-08, "1": 0, "2": 0}, "score": 4.999878148014347}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9975104433989919, "4": 0.002489304312781732, "3": 2.1028270442745392e-07, "1": 0, "2": 0}, "score": 4.997510275017227}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998932440088264, "4": 0.00010671679586515268, "3": 2.128462193208479e-08, "1": 0, "2": 0}, "score": 4.999893240632979}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996919947733519, "4": 0.00030798021933234885, "3": 1.7940591676621512e-08, "1": 0, "2": 0}, "score": 4.999691983897307}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996588742266319, "4": 0.00034098331892015504, "3": 4.234726494949896e-08, "1": 0, "2": 0}, "score": 4.999658931952406}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9820956353789576, "4": 0.01789241498133158, "3": 1.1884423082255634e-05, "2": 6.728261194653322e-08, "1": 0}, "score": 4.982083614361684}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9865406461362898, "4": 0.013455110261529754, "3": 4.115430961147575e-06, "2": 9.183357118340693e-09, "1": 0}, "score": 4.986536629724499}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9090941816461856, "4": 0.09086707087773843, "3": 3.8599200273933275e-05, "2": 6.979412498429203e-08, "1": 0}, "score": 4.909055514201863}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9955754273905957, "4": 0.004422478471014304, "3": 1.9824938214242902e-06, "2": 3.873129141217693e-08, "1": 0}, "score": 4.995573440024713}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997915939795524, "4": 0.00020820112465434274, "3": 9.370708845779017e-08, "1": 0, "2": 0}, "score": 4.999791611437999}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9591784357658658, "3": 0.03787084970131394, "5": 0.0029080640328609697, "2": 4.245089762352383e-05, "1": 4.3096933106083724e-08}, "score": 3.964952177760327}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7730877021299413, "5": 0.2257171753307781, "3": 0.0011942686372457248, "2": 7.755014380341069e-07, "1": 1.5134741110058984e-08}, "score": 4.224521324490967}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5140794260889081, "5": 0.4855782403809498, "3": 0.000342003016761676, "2": 2.350590682808212e-07, "1": 0}, "score": 4.485235813563902}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975243225566032, "4": 0.0024751593529594245, "3": 4.73758565737892e-07, "2": 2.0153237187193867e-09, "1": 0}, "score": 4.997523886979159}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9368817175351997, "4": 0.06310604586496742, "3": 1.2185120277352981e-05, "2": 2.1529193190642535e-08, "1": 0}, "score": 4.936869517416119}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5433335907915894, "5": 0.4564449626323808, "3": 0.00022111292811725377, "2": 2.111835872539068e-07, "1": 0}, "score": 4.45622348320819}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998638116144802, "4": 0.00013610975168390445, "3": 1.988031084050359e-08, "1": 0, "2": 0}, "score": 4.999863850479695}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8470497070860793, "4": 0.15292219749972738, "3": 2.8068938064352758e-05, "2": 1.323629711033153e-08, "1": 0}, "score": 4.847021622889845}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6897824299688564, "4": 0.31005418700121784, "3": 0.00016271131515982592, "2": 5.869418999239544e-07, "1": 0}, "score": 4.689618603230841}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9789787984687194, "4": 0.021020796957578285, "3": 4.0867811322000793e-07, "1": 0, "2": 0}, "score": 4.978978385772477}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9864237124848199, "4": 0.013567618743642073, "3": 8.515172378124335e-06, "2": 3.384156690300715e-08, "1": 0}, "score": 4.986415247760023}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999827604126034, "4": 1.7147142779677784e-05, "3": 1.2367274577488439e-08, "1": 0, "2": 0}, "score": 4.999982828121296}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9987947806609042, "4": 0.0012047195231547035, "3": 4.691126056425546e-07, "1": 0, "2": 0}, "score": 4.998794342214617}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6580771139965035, "4": 0.33996853832218893, "3": 0.001952693846500989, "2": 9.940155366295193e-07, "1": 0}, "score": 4.656122865041439}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9761718131484398, "4": 0.023814119926490376, "3": 1.3909034012265652e-05, "2": 4.490853370555563e-08, "1": 0}, "score": 4.976157924586146}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8099633574945142, "4": 0.18996745708338306, "3": 6.885174418465708e-05, "2": 2.0793943032764681e-07, "1": 0}, "score": 4.809894191706339}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9852810180371463, "4": 0.014714945514821824, "3": 3.967860600821923e-06, "2": 7.899763615576768e-09, "1": 0}, "score": 4.985277094171186}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7598005381122899, "4": 0.24010916617372025, "3": 9.012121143725098e-05, "2": 1.244718812455223e-07, "1": 0}, "score": 4.759710205965902}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997623992715251, "4": 0.00023741521207959652, "3": 5.6543646081418825e-08, "1": 0, "2": 0}, "score": 4.999762471669992}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9399103101541406, "4": 0.060078784685589595, "3": 1.0747815858361572e-05, "2": 1.197874397800275e-07, "1": 0}, "score": 4.939899358063177}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8803013649196562, "3": 0.08813996646875599, "5": 0.027857788299959003, "2": 0.0036755996116270982, "1": 2.4945203468495818e-05}, "score": 3.9322917642816644}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7497597703205858, "4": 0.24857084090672948, "3": 0.0016478184786692226, "2": 1.9776879590562036e-05, "1": 1.2229849587325427e-06}, "score": 4.748069155848549}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9562166722478727, "5": 0.02306776708886173, "3": 0.020691305315852688, "2": 2.3900360869465117e-05, "1": 1.832552219993242e-07}, "score": 4.002328111685414}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.666090547816982, "4": 0.3334093048789016, "3": 0.0004990579184051692, "2": 8.178302828898478e-07, "1": 0}, "score": 4.665590034982598}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9705889857043923, "5": 0.02411722411955553, "3": 0.005286252480190543, "2": 7.283988317193851e-06, "1": 8.815404865521099e-08}, "score": 4.018816142315663}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8271356423962756, "4": 0.1728296416494189, "3": 3.463385105452836e-05, "2": 7.100425728089349e-08, "1": 0}, "score": 4.8271008757166936}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6156733882140275, "4": 0.3841089855984922, "3": 0.00021743578334904528, "2": 2.1366381822990613e-07, "1": 1.5911129564129727e-08}, "score": 4.61545545326176}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8792496286295371, "5": 0.11996862844545256, "3": 0.0007813397371171645, "2": 4.2271189045348384e-07, "1": 1.250271520282729e-08}, "score": 4.11918640195926}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9905949259894116, "4": 0.009404264710379329, "3": 7.117942087264527e-07, "1": 0, "2": 0}, "score": 4.9905943107840915}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995483374102708, "4": 0.00045142225167081823, "3": 1.5900550701682896e-07, "1": 0, "2": 0}, "score": 4.999548259700574}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9299501987498663, "5": 0.045264939890597405, "3": 0.024712378673918314, "2": 7.176755961189608e-05, "1": 5.83891884813869e-07}, "score": 4.020407277099932}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5091474595334041, "4": 0.4899132423413658, "3": 0.0009367323145990531, "2": 2.351735480562209e-06, "1": 5.7302304264164136e-08}, "score": 4.508205931513821}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9472147052543375, "4": 0.05273428846481676, "3": 5.0690958327840794e-05, "2": 2.1192995877494128e-07, "1": 1.1707829861947389e-08}, "score": 4.947163642153043}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997850428466002, "4": 0.00021489414498222962, "3": 2.832961820210866e-08, "1": 0, "2": 0}, "score": 4.999785049188327}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9083594033763301, "4": 0.09154641203004164, "3": 9.368813540028497e-05, "2": 4.548232295350694e-07, "1": 0}, "score": 4.908264843410075}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9547153574068585, "4": 0.0452635050147458, "3": 2.094656262996286e-05, "2": 6.747882445928759e-08, "1": 9.493010936386101e-09}, "score": 4.9546943562846435}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9791795939040446, "4": 0.020779486601345955, "3": 4.068801421169064e-05, "2": 2.8452235785008336e-07, "1": 1.2619330903234766e-08}, "score": 4.979138234695644}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9519285590703194, "4": 0.048044121133004325, "3": 2.7270309819141738e-05, "2": 3.3632095590750715e-08, "1": 0}, "score": 4.951901236588476}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999882437011058, "4": 1.1679189209132426e-05, "3": 3.4570265360577832e-09, "1": 0, "2": 0}, "score": 4.9999883138958765}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999866940725246, "4": 1.3193371679257791e-05, "3": 1.598361023555497e-08, "1": 0, "2": 0}, "score": 4.999986774659823}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9002926246535056, "5": 0.06667065352602211, "3": 0.03294443251462336, "2": 9.174450168172125e-05, "1": 3.234536532125585e-07}, "score": 4.033541769071564}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8995592804349146, "4": 0.10030520410163266, "3": 0.000135180045189609, "2": 3.546485634215569e-07, "1": 2.3499328280813345e-08}, "score": 4.89942328216259}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7806582070123806, "5": 0.21831207569153085, "3": 0.0010276958720798674, "2": 2.0214792754165153e-06, "1": 3.697484575354626e-08}, "score": 4.217280217890451}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989040781614494, "4": 0.0010950995572320617, "3": 8.155557942475533e-07, "2": 8.650168815069979e-09, "1": 0}, "score": 4.998903243382784}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7291092612107851, "3": 0.2624785800734729, "5": 0.007243263604865247, "2": 0.0011666212832300914, "1": 2.22835257747797e-06}, "score": 3.742424744193947}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7099042764056125, "4": 0.2898763576056213, "3": 0.00021884452757696597, "2": 4.851949829980239e-07, "1": 0}, "score": 4.709684487225633}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5361197653788428, "4": 0.46370579052919036, "3": 0.0001743381070929525, "2": 1.1280767042192383e-07, "1": 0}, "score": 4.535945197999764}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9002557044100233, "5": 0.09790721837883158, "3": 0.0018360741516324894, "2": 9.233679833900712e-07, "1": 0}, "score": 4.096069305147142}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970239999933996, "4": 0.002975736820183321, "3": 2.5245646978099564e-07, "1": 0, "2": 0}, "score": 4.997023758234943}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7426429363230161, "4": 0.2572965161029656, "3": 6.0421050229914794e-05, "2": 7.155038143005628e-08, "1": 0}, "score": 4.742582412994309}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9984434999047163, "4": 0.0015562254079446978, "3": 2.9443016285206075e-07, "1": 0, "2": 0}, "score": 4.998443185762465}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.684298673159794, "4": 0.3156050464876345, "3": 9.611636164772968e-05, "2": 1.3375019409416783e-07, "1": 0}, "score": 4.684202309988534}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8765613086042517, "5": 0.12059047233587265, "3": 0.0028406121621039255, "2": 7.435460821098024e-06, "1": 1.206385442081151e-07}, "score": 4.117734633317227}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992713909245954, "4": 0.0007285644986567533, "3": 3.840270258544416e-08, "1": 0, "2": 0}, "score": 4.99927135869144}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9621648608251395, "5": 0.03661700972321905, "3": 0.0012146470964217353, "2": 3.3988344293964832e-06, "1": 4.367478079250592e-08}, "score": 4.035395435343963}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9657643225995269, "5": 0.027735752335251114, "3": 0.006493767553388031, "2": 5.988581411569049e-06, "1": 0}, "score": 4.021230011205435}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8240800464836339, "5": 0.17362112436996835, "3": 0.00229695625468364, "2": 1.7611861976438318e-06, "1": 0}, "score": 4.171320664880353}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7241080625995956, "4": 0.27557002733057545, "3": 0.0003214707494238541, "2": 4.5520043432213625e-07, "1": 0}, "score": 4.723785669955565}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9965824257466303, "4": 0.0034167116373542026, "3": 8.391461081926286e-07, "2": 3.641584309969291e-09, "1": 0}, "score": 4.996581599077895}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9790144496097765, "4": 0.02096798559417186, "3": 1.7294673396955955e-05, "2": 2.2962621550274575e-07, "1": 0}, "score": 4.9789967353298294}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9498010285077433, "3": 0.032412747247296765, "5": 0.01769333259350855, "2": 9.234813928805753e-05, "1": 4.5677541504819033e-07}, "score": 3.985094517448537}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9424823524747425, "4": 0.057499904042862926, "3": 1.757874598786091e-05, "2": 5.949652080321731e-08, "1": 0}, "score": 4.942464753920596}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7685532481383334, "5": 0.23041802954235446, "3": 0.0010258774333931568, "2": 2.812921317148731e-06, "1": 6.788274217526351e-08}, "score": 4.229386314378971}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998155492131384, "4": 0.00018424889945865887, "3": 1.438834845451543e-07, "1": 0, "2": 0}, "score": 4.999815463322868}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9941999595575006, "4": 0.005796379386835529, "3": 3.5190728427336668e-06, "2": 7.082909318212661e-08, "1": 1.3199168523262688e-08}, "score": 4.994196316847176}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9991143046298947, "4": 0.0008855263889497, "3": 1.407930155389633e-07, "1": 0, "2": 0}, "score": 4.99911419200005}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999932220207154, "4": 6.769183438620325e-05, "3": 1.8737855519660545e-08, "1": 0, "2": 0}, "score": 4.999932270685215}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.934203275230721, "4": 0.06576926151680804, "3": 2.7271946086818412e-05, "2": 6.994014724561914e-08, "1": 0}, "score": 4.934175976781763}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999214926618624, "4": 7.844671134963404e-05, "3": 1.63373653468157e-08, "1": 0, "2": 0}, "score": 4.999921520610444}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9868498226453278, "5": 0.01314658828536687, "3": 3.054123234952882e-06, "2": 5.351857751759101e-08, "1": 0}, "score": 4.013143433452587}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8325756503206871, "5": 0.16566927453790864, "3": 0.0017513033444356823, "2": 3.6949113342332176e-06, "1": 9.653530891815426e-08}, "score": 4.163910288544095}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6608187912883442, "4": 0.33907857967888905, "3": 0.00010246297952409792, "2": 1.0336494040690373e-07, "1": 0}, "score": 4.660716162998114}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.584173156059205, "5": 0.4149350819599091, "3": 0.000890133238734252, "2": 1.560291336457171e-06, "1": 2.2082310031898912e-08}, "score": 4.414041781090071}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9588073218292814, "4": 0.04118125507773674, "3": 1.126104649957333e-05, "2": 4.637292782666924e-08, "1": 0}, "score": 4.9587960789442755}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9962116287532622, "4": 0.003788104185290392, "3": 3.030242504958116e-07, "1": 0, "2": 0}, "score": 4.99621128990246}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9099129439832436, "4": 0.09006935448741989, "3": 1.7590351789706214e-05, "2": 2.087841472388222e-08, "1": 0}, "score": 4.909895394037388}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999713795214406, "4": 0.00028596046241645965, "3": 1.7893020917692196e-07, "1": 0, "2": 0}, "score": 4.999713681658442}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7406749825118134, "4": 0.25914389303283275, "3": 0.0001809420036260603, "2": 1.884095096930995e-07, "1": 0}, "score": 4.740493659277467}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8686564511767271, "4": 0.131308692042209, "3": 3.4578239152015316e-05, "2": 1.0159820187899818e-07, "1": 0}, "score": 4.86862182343834}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998757304221038, "4": 0.0001240903039188387, "3": 6.990483638800205e-08, "1": 0, "2": 0}, "score": 4.999875769872822}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8964002707624702, "5": 0.10145245640919935, "3": 0.002145183247888638, "2": 2.015982274912307e-06, "1": 2.6255692874827094e-08}, "score": 4.099303167130941}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998262719524653, "4": 0.00017352792856078242, "3": 1.0788931461834647e-07, "1": 0, "2": 0}, "score": 4.999826256276785}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7283781200147602, "5": 0.26905028063186326, "3": 0.0025663669970577944, "2": 4.991285830161025e-06, "1": 0}, "score": 4.266473995302161}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987799238987968, "4": 0.00121988620399662, "3": 1.864572214083018e-07, "1": 0, "2": 0}, "score": 4.998779740877362}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9980008010656533, "4": 0.001998982455781273, "3": 1.8171941778008525e-07, "1": 0, "2": 0}, "score": 4.998000654035888}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9886352077467573, "4": 0.011361457191680384, "3": 3.250242334307851e-06, "2": 3.798741535245483e-09, "1": 0}, "score": 4.988632030006388}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7571198089272925, "4": 0.2428046666115071, "3": 7.536949050872956e-05, "2": 5.823577385463787e-08, "1": 0}, "score": 4.7570443961978635}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9947799085783428, "4": 0.005219897047412482, "3": 1.975241463654818e-07, "1": 0, "2": 0}, "score": 4.994779707920738}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5454801298201665, "5": 0.4542140573944426, "3": 0.00030563040891816434, "2": 1.6691168445688994e-07, "1": 0}, "score": 4.4539081001817475}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5581491546944072, "4": 0.4415980057474045, "3": 0.00025236780270360907, "2": 2.640854795587897e-07, "1": 0}, "score": 4.557896374579087}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8054260877833732, "4": 0.19435256965125444, "3": 0.00021985682916095365, "2": 1.3359164796981126e-06, "1": 1.1475596577873364e-07}, "score": 4.805203243086815}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997117693464384, "4": 0.00028791104415548245, "3": 1.9079276460665998e-07, "1": 0, "2": 0}, "score": 4.999711707333179}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9827079290587261, "4": 0.017286270591140986, "3": 5.766005528143989e-06, "2": 4.8225158089265633e-08, "1": 0}, "score": 4.982702052962432}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999701251202631, "4": 2.9758581910249325e-05, "3": 1.093873147063196e-08, "1": 0, "2": 0}, "score": 4.999970219537489}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9425343487754166, "4": 0.05740697312621375, "3": 5.8225974822398326e-05, "2": 3.532552335723802e-07, "1": 0}, "score": 4.94247550947109}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8903664940065577, "4": 0.1096121996486422, "3": 2.1197199162302336e-05, "2": 5.1554001800542224e-08, "1": 0}, "score": 4.890345244975831}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9988368848433934, "4": 0.0011629267396407704, "3": 2.0223731548161385e-07, "1": 0, "2": 0}, "score": 4.998836668801806}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7236203012163561, "4": 0.27616394113152837, "3": 0.00021511818138399553, "2": 5.424656887910764e-07, "1": 0}, "score": 4.723404168277447}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998978924633294, "4": 0.00010206109024426456, "3": 1.5290287714720163e-08, "1": 0, "2": 0}, "score": 4.999897908326}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8300220601920982, "4": 0.16992682088347882, "3": 5.101029922703931e-05, "2": 1.0664396293077308e-07, "1": 0}, "score": 4.829970838249311}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"4": 0.960918733599699, "3": 0.02936823590785385, "5": 0.009625504351743381, "2": 8.709370064242277e-05, "1": 2.908166026202012e-07}, "score": 3.98008220577197}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9392029433712923, "4": 0.06078387129225721, "3": 1.3102048053698557e-05, "2": 2.478745892963762e-08, "1": 0}, "score": 4.939189846691807}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9080934165589025, "4": 0.09189478478810759, "3": 1.1727500548187905e-05, "2": 1.4640561138723604e-08, "1": 0}, "score": 4.908081711094638}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999629731405111, "4": 3.6899299161922076e-05, "3": 2.2410303638140406e-08, "1": 0, "2": 0}, "score": 4.999963055876346}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.975086466818564, "4": 0.024904568959368992, "3": 8.632978320068318e-06, "2": 1.8788007060299058e-07, "1": 3.156458729432621e-08}, "score": 4.975077472399113}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9018821514046811, "4": 0.09806615274797062, "3": 5.15200760522406e-05, "2": 1.126848333926217e-07, "1": 0}, "score": 4.901830462852256}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9944251832857155, "4": 0.00557401309848274, "3": 7.559035864881432e-07, "1": 0, "2": 0}, "score": 4.994424474828325}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.55208740657266, "4": 0.4476742641389931, "3": 0.00023799366554598454, "2": 2.3220551892148998e-07, "1": 0}, "score": 4.5518490055668}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9930754671308784, "4": 0.006922668239002209, "3": 1.8306142347931336e-06, "2": 1.2629493554530208e-08, "1": 0}, "score": 4.993073632495918}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9908556254369584, "4": 0.009142627154232424, "3": 1.630824243655143e-06, "2": 4.988462953416384e-09, "1": 0}, "score": 4.990854095211244}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9776257616291827, "4": 0.022366745479616243, "3": 7.416895385509265e-06, "2": 1.4652585974938356e-08, "1": 0}, "score": 4.977618375398894}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5535346318257026, "4": 0.44620762873934317, "3": 0.0002574810326976689, "2": 2.172521883270189e-07, "1": 0}, "score": 4.553276739056003}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9560014587908964, "4": 0.04399053860020736, "3": 8.006706940145523e-06, "2": 6.007645072771547e-09, "1": 0}, "score": 4.955993430407694}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9961333136583062, "4": 0.0038664647141540697, "3": 2.393045089407564e-07, "1": 0, "2": 0}, "score": 4.996133056745184}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.678136149994693, "5": 0.31791481800302307, "3": 0.003923826316926746, "2": 2.487085305933462e-05, "1": 3.750876893669689e-07}, "score": 4.313940112079127}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"4": 0.806204569795663, "5": 0.1743609505456498, "3": 0.01915026740012438, "2": 0.00028316862208661067, "1": 9.510273648490734e-07}, "score": 4.15464150714047}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.999946523779904, "4": 5.3446949187432845e-05, "3": 5.081623702242375e-09, "1": 0, "2": 0}, "score": 4.999946542886272}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7602845255797892, "4": 0.23963237519980765, "3": 8.294000855493297e-05, "2": 1.3381106427939776e-07, "1": 0}, "score": 4.760201337258816}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999947998470209, "4": 5.130630509493217e-06, "3": 2.11018545490695e-09, "1": 0, "2": 0}, "score": 4.999994865148773}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99996356913662, "4": 3.633369537512146e-05, "3": 5.7664338370725835e-09, "1": 0, "2": 0}, "score": 4.999963654768435}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9726852920183275, "4": 0.027310528275999387, "3": 4.0567475559174395e-06, "2": 3.80296047943045e-09, "1": 0}, "score": 4.972681343564849}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9610367560812832, "4": 0.03894195791496359, "3": 2.114354288566463e-05, "2": 2.005964001474728e-08, "1": 0}, "score": 4.961015690048617}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9098412001761472, "5": 0.08523149958798933, "3": 0.004922611975601091, "2": 4.626661538258076e-06, "1": 0}, "score": 4.080299639235667}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9981469725791831, "4": 0.0018523558825771275, "3": 6.099608879191745e-07, "1": 0, "2": 0}, "score": 4.99814642408151}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997623992715251, "4": 0.0002374301697091181, "3": 6.628103691815091e-08, "1": 0, "2": 0}, "score": 4.999762437243445}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5836423314050136, "3": 0.41176523911836405, "2": 0.0025269819334703364, "5": 0.00206339127451474, "1": 2.0691058510942036e-06}, "score": 3.5852379862960455}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9982501910039817, "4": 0.001749266013299511, "3": 4.889097132496773e-07, "1": 0, "2": 0}, "score": 4.998249756072632}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9536910756960318, "5": 0.03810429780234999, "3": 0.008193193748900271, "2": 1.1348057205612696e-05, "1": 5.249835506158398e-08}, "score": 4.029888251406289}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992875835891616, "4": 0.0007123465766685668, "3": 2.0252896835907427e-08, "1": 0, "2": 0}, "score": 4.999287612882217}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8537450210274493, "5": 0.1244557808577342, "3": 0.021361105726672117, "2": 0.0004346820559411218, "1": 3.186631994548738e-06}, "score": 4.102215773988886}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8064142102358861, "5": 0.15255425129509526, "3": 0.04020455424891333, "2": 0.0008163590398136923, "1": 1.0430597540881193e-05}, "score": 4.110685708711462}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9723184322277237, "5": 0.01714764212919973, "3": 0.01051688729458704, "2": 1.679196600372268e-05, "1": 9.966771837719098e-08}, "score": 4.006596872867308}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9958097862467507, "4": 0.004188856474824031, "3": 1.3536119768336366e-06, "2": 4.2245926288204455e-09, "1": 0}, "score": 4.995808423629784}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988141656578796, "4": 0.001185524483742748, "3": 2.1350576549114173e-07, "2": 2.6749637716461615e-09, "1": 0}, "score": 4.998814040368736}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9684212797762166, "4": 0.03155332207422708, "3": 2.5027283204043735e-05, "2": 2.4804342631545723e-07, "1": 0}, "score": 4.968395875347375}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8028616510328557, "5": 0.19360741582346574, "3": 0.0035164757440269276, "2": 1.4228052698874713e-05, "1": 2.3938133801853356e-07}, "score": 4.1900617639228726}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.918571116997367, "3": 0.05714042753333664, "5": 0.02355775295904544, "2": 0.0007264571922152724, "1": 3.985985396015004e-06}, "score": 3.9649524439961152}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9677003871722414, "4": 0.032271567486140844, "3": 2.7927072475177974e-05, "2": 3.246562498927505e-08, "1": 0}, "score": 4.967672478198218}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8708789151421914, "4": 0.12901448423913098, "3": 0.00010602273560622968, "2": 5.430486099134491e-07, "1": 3.0247660327689345e-08}, "score": 4.87077171956044}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8803986612030007, "5": 0.09713462267898931, "3": 0.021247728148200123, "2": 0.001205515503243233, "1": 1.3377183850080477e-05}, "score": 4.073435738969909}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9220215616144636, "5": 0.07635356924111637, "3": 0.0016229090990455195, "2": 1.8123087011153203e-06, "1": 3.17338469039549e-08}, "score": 4.074726948991665}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.525109850095839, "5": 0.471689537193019, "3": 0.0031980245113899923, "2": 2.3427080767291028e-06, "1": 0}, "score": 4.4684869422751206}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5803921982994448, "5": 0.4187750402578422, "3": 0.0008314831700542942, "2": 1.1782738847158184e-06, "1": 3.52642194632234e-08}, "score": 4.417941121802593}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998406931906776, "4": 0.00015922520089539904, "3": 3.1983266269496934e-08, "1": 0, "2": 0}, "score": 4.999840710824667}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999844149545944, "4": 0.00015576867559079493, "3": 3.973140118738155e-08, "1": 0, "2": 0}, "score": 4.999844151855054}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7721352422798614, "5": 0.217462403688374, "3": 0.01028038570209414, "2": 0.00011998245910400501, "1": 1.7566719087067956e-06}, "score": 4.20693683048199}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.991469532686714, "4": 0.008525846197796375, "3": 4.503953460979927e-06, "2": 1.5005020377615332e-08, "1": 0}, "score": 4.991465100008321}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9511007318658321, "4": 0.04887419164725401, "3": 2.480488371967292e-05, "2": 8.210967363193194e-08, "1": 0}, "score": 4.951075942985494}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998505818939973, "4": 0.00014935478126320843, "3": 1.964800559932082e-08, "1": 0, "2": 0}, "score": 4.9998506059162}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9969794455816184, "4": 0.003020111281788204, "3": 4.837783450018161e-07, "2": 2.733784292204411e-09, "1": 0}, "score": 4.99697891309121}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9928769374275133, "4": 0.007122393815657045, "3": 6.912695516674454e-07, "2": 3.450999285058288e-09, "1": 0}, "score": 4.992876213477202}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8176892700590761, "5": 0.17759620800059708, "3": 0.0046093814807949725, "2": 0.00010342353609327772, "1": 1.4386778872119937e-06}, "score": 4.172775711488026}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6750065395056626, "4": 0.3246162706262446, "3": 0.00037643016976428886, "2": 7.16678136644968e-07, "1": 1.3874780461967395e-08}, "score": 4.6746286540176145}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9996059856140641, "4": 0.00039387813442514887, "3": 5.754204148769043e-08, "1": 0, "2": 0}, "score": 4.999606006750482}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.974425551077625, "4": 0.025555559322321064, "3": 1.8747596508082734e-05, "2": 7.702991377124398e-08, "1": 0}, "score": 4.974406712732033}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8295646283247263, "4": 0.17037176102577514, "3": 6.34218575263276e-05, "2": 2.0306900287956148e-07, "1": 0}, "score": 4.829500788486387}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9305414946184691, "4": 0.06943768828575042, "3": 2.0613198158817538e-05, "2": 1.0207275434824175e-07, "1": 0}, "score": 4.930520772024956}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.866645324084713, "5": 0.13102641957104919, "3": 0.0023238429958461664, "2": 4.25935848243779e-06, "1": 5.118138219673567e-08}, "score": 4.128693917544923}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963985912848087, "4": 0.0036007446776817604, "3": 6.621279643943698e-07, "2": 6.107526340462349e-09, "1": 0}, "score": 4.996397912758933}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921927511275698, "4": 0.007805575444952144, "3": 1.6450841829676745e-06, "2": 7.2065175868029e-09, "1": 0}, "score": 4.992191112602074}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8342641918399937, "4": 0.1656788339308353, "3": 5.66893043968825e-05, "2": 8.832850159931641e-08, "1": 0}, "score": 4.8342074898806775}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9800750172822432, "4": 0.019916245968145906, "3": 8.736053630134246e-06, "2": 3.940618709905381e-08, "1": 0}, "score": 4.980066164477676}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8543083370045047, "4": 0.14564455214763292, "3": 4.684946353683206e-05, "2": 1.157991050787685e-07, "1": 0}, "score": 4.8542613803105885}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997720525239746, "4": 0.00022782608617697757, "3": 3.764619312614786e-08, "1": 0, "2": 0}, "score": 4.999772098602351}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992017686163097, "4": 0.0007967425143034605, "3": 1.104958257197451e-06, "1": 0, "2": 0}, "score": 4.999201047262455}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7471713395025213, "5": 0.25072734629750026, "3": 0.0020904402275385182, "2": 1.044518971379563e-05, "1": 1.546056740467321e-07}, "score": 4.24861562003821}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9575974573248424, "4": 0.04235918492726646, "3": 4.304506361428779e-05, "2": 2.258324464561083e-07, "1": 1.9591970950895467e-08}, "score": 4.957553966225367}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9940219570321167, "4": 0.005977254082530277, "3": 7.555959963272869e-07, "1": 0, "2": 0}, "score": 4.994021234526448}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999636883392843, "4": 3.6262369764072605e-05, "3": 3.4611428463545513e-09, "1": 0, "2": 0}, "score": 4.999963730706289}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9938165656053347, "4": 0.006182215355403781, "3": 1.1823258501812363e-06, "2": 6.5690474482953505e-09, "1": 0}, "score": 4.993815400099323}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9982290502852965, "4": 0.0017706727851736109, "3": 2.024293297903848e-07, "1": 0, "2": 0}, "score": 4.9982289222242215}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9973269720184172, "4": 0.0026727411106371524, "3": 2.394786663130738e-07, "1": 0, "2": 0}, "score": 4.9973267798053405}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8974423362386915, "4": 0.10253115247445012, "3": 2.6383361307738002e-05, "2": 1.398453035380476e-07, "1": 0}, "score": 4.897415662489804}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999970244320709, "4": 2.9708168984255423e-05, "3": 9.004071257054896e-09, "1": 0, "2": 0}, "score": 4.999970273821728}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997720525239746, "4": 0.0002279179185926955, "3": 1.694800007087822e-08, "1": 0, "2": 0}, "score": 4.999772048182533}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9983802868534847, "4": 0.0016191164172254678, "3": 2.988252149097478e-07, "1": 0, "2": 0}, "score": 4.998380285449826}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9707340860144716, "4": 0.029253475261585612, "3": 1.2294549793573594e-05, "2": 1.1272282506349679e-08, "1": 0}, "score": 4.970721897930866}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5370841730083811, "5": 0.46273418695901425, "3": 0.00018149508218970168, "2": 1.3093340523332556e-07, "1": 1.3272322301934696e-08}, "score": 4.462552390537504}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997927857718344, "4": 0.00020705150069818564, "3": 5.877354489714168e-08, "1": 0, "2": 0}, "score": 4.9997928309306765}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999583243784529, "4": 4.1593610343765416e-05, "3": 1.8633384490353132e-08, "1": 0, "2": 0}, "score": 4.999958369120249}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9437157664849963, "3": 0.029881566312331194, "5": 0.02631235969000817, "2": 8.989538074083212e-05, "1": 2.644983034093523e-07}, "score": 3.9962502085676905}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.961503798849105, "4": 0.03847856292137993, "3": 1.739918833927338e-05, "2": 1.1433809866859288e-07, "1": 2.1260881543609327e-08}, "score": 4.961486206660168}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6629804012116133, "5": 0.33596291403719153, "3": 0.0010534715819258465, "2": 2.882343152462699e-06, "1": 9.465539135044289e-08}, "score": 4.334903472897183}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999866940725246, "4": 1.320605660357146e-05, "3": 3.036081904530728e-09, "1": 0, "2": 0}, "score": 4.999986787869953}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9995647765372202, "4": 0.0004350573484708333, "3": 9.777391629771077e-08, "1": 0, "2": 0}, "score": 4.9995647470739515}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9944739968382834, "4": 0.005525160401798568, "3": 6.861613725026875e-07, "1": 0, "2": 0}, "score": 4.994473466410009}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9923555426314676, "4": 0.007641544779293567, "3": 2.8265179789461876e-06, "2": 8.443406466433962e-09, "1": 0}, "score": 4.992352776260892}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6402124401328334, "5": 0.35915813500531585, "3": 0.0006286625070690674, "2": 7.683157926247579e-07, "1": 0}, "score": 4.358527933729473}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9672832888699368, "4": 0.03271474778992831, "3": 1.8767087128799504e-06, "1": 0, "2": 0}, "score": 4.967281495958195}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9980554056782454, "4": 0.0019443502877581616, "3": 2.545903637819252e-07, "1": 0, "2": 0}, "score": 4.9980551405520455}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9985523654352588, "4": 0.0014452658429197748, "3": 2.358313059071918e-06, "1": 0, "2": 0}, "score": 4.998550017515869}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8421987310197356, "4": 0.15741691243656167, "3": 0.0003836215646628572, "2": 7.22607239211335e-07, "1": 0}, "score": 4.841813674655347}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9601964212311315, "4": 0.039784193254022306, "3": 1.923461572239252e-05, "2": 1.706855423461979e-08, "1": 0}, "score": 4.960177280979373}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.99983258867484, "4": 0.00016715283239715603, "3": 1.285721643463443e-07, "1": 0, "2": 0}, "score": 4.999832590001525}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9684792996330555, "4": 0.031491538131005054, "3": 2.8954700528279886e-05, "2": 9.393507357247088e-08, "1": 0}, "score": 4.968450267078657}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8724306171139734, "5": 0.12471077782486645, "3": 0.002853474227268753, "2": 4.918165317267885e-06, "1": 0}, "score": 4.121847493180095}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.995105145338084, "4": 0.004893534671051842, "3": 1.2825952418599381e-06, "2": 2.6477383875361465e-09, "1": 0}, "score": 4.995103892025121}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8070648375592488, "5": 0.19179344372304966, "3": 0.0011401694354864847, "2": 1.4014614121089433e-06, "1": 4.077543582344296e-08}, "score": 4.1906503694466695}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9990141206986459, "4": 0.000985648261267906, "3": 1.4533491489785617e-07, "1": 0, "2": 0}, "score": 4.999014060984403}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921419372770476, "4": 0.007856508361945208, "3": 1.4749565886932631e-06, "2": 6.590675433378302e-09, "1": 0}, "score": 4.992140521380573}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8629431197311556, "4": 0.13692106323176342, "3": 0.00013535873602861848, "2": 4.2515926374300026e-07, "1": 0}, "score": 4.862806939271564}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7430957746106992, "5": 0.25401176351114807, "3": 0.002884950606401518, "2": 7.333600222199619e-06, "1": 8.986421752570372e-08}, "score": 4.25111189816111}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9999598739650709, "4": 3.999888416957727e-05, "3": 1.285431865457523e-08, "1": 0, "2": 0}, "score": 4.999959975402618}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999615427524989, "4": 3.8340491535246223e-05, "3": 8.379613879047109e-09, "1": 0, "2": 0}, "score": 4.99996164274508}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99997334352929, "4": 2.6599503706528003e-05, "3": 1.0095682295464624e-08, "1": 0, "2": 0}, "score": 4.999973380303682}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7442305820907591, "4": 0.25560832157143015, "3": 0.0001603788065503657, "2": 5.686270874581876e-07, "1": 4.016479384646239e-08}, "score": 4.744069026445256}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9160226660665611, "4": 0.08396597682385867, "3": 1.1312208694864446e-05, "2": 6.639321914387444e-09, "1": 0}, "score": 4.916011375627249}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9878961253963333, "4": 0.012101195858281446, "3": 2.60450479166236e-06, "2": 6.478609065556511e-09, "1": 0}, "score": 4.987893574875953}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998362833730299, "4": 0.00016364485443674218, "3": 1.5178558954784053e-08, "1": 0, "2": 0}, "score": 4.999836324779182}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.956109324784305, "4": 0.043873402856049626, "3": 1.7121612561671805e-05, "2": 7.175559544867455e-08, "1": 0}, "score": 4.9560921351836935}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"4": 0.4804481138813716, "3": 0.4317549228222868, "2": 0.07666004745483365, "5": 0.0109200503267419, "1": 0.0002165755739652418}, "score": 3.42519513921351}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8411257380653518, "4": 0.15820117442556517, "3": 0.0006647270850273677, "2": 8.198191309793875e-06, "1": 1.6253068861365437e-07}, "score": 4.840444126755234}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8869575506793435, "4": 0.112002823296533, "3": 0.001026308084517769, "2": 1.24938379400389e-05, "1": 7.787825266096102e-07}, "score": 4.885903958719772}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9949777896823188, "4": 0.005007497448300336, "3": 1.4320027156928761e-05, "2": 3.1690208211891815e-07, "1": 4.356712433622189e-08}, "score": 4.994962737359572}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9170230139862281, "4": 0.08260845028461807, "3": 0.00036544710821943214, "2": 2.9160983986330485e-06, "1": 8.87962870786328e-08}, "score": 4.916651545040146}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9391544648449544, "3": 0.05570026357574729, "5": 0.004935681600652695, "2": 0.00020890916869722927, "1": 6.066150084959924e-07}, "score": 3.948815776044875}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5648029329028086, "4": 0.43241141257767374, "3": 0.002755736334602663, "2": 2.875117275714493e-05, "1": 1.1671531258832465e-06}, "score": 4.561986192684094}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9703785848205716, "3": 0.020542739694553242, "5": 0.009049591141732155, "2": 2.8875299987465177e-05, "1": 2.0061263045817807e-07}, "score": 3.988448498911927}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9818734270102644, "4": 0.018117462985638134, "3": 9.049165630749485e-06, "2": 4.7067033814238466e-08, "1": 0}, "score": 4.981864297232244}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8801785274353664, "5": 0.10942800878078851, "3": 0.010335951751063999, "2": 5.667683412169572e-05, "1": 5.65591924626754e-07}, "score": 4.098977033270582}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9962233412822333, "4": 0.003773633305918777, "3": 2.916970442418289e-06, "2": 4.0758476769868073e-08, "1": 0}, "score": 4.996220410221953}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6473811075186879, "4": 0.3524317825989817, "3": 0.00018608797727059307, "2": 8.554681277556423e-07, "1": 0}, "score": 4.647193416322048}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9171737115888622, "4": 0.0827175737109092, "3": 0.0001085336819976606, "2": 8.174395294473143e-08, "1": 0}, "score": 4.917065105459935}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999962734742367, "4": 3.718399987858787e-05, "3": 9.170812045670678e-09, "1": 0, "2": 0}, "score": 4.999962797655816}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9991321475020006, "4": 0.0008677848870475003, "3": 6.339378555149401e-08, "1": 0, "2": 0}, "score": 4.999132088321721}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7578343673106087, "4": 0.2420904650884972, "3": 7.459769122201774e-05, "2": 2.894390782217339e-07, "1": 0}, "score": 4.75775940327046}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9770550525107549, "4": 0.022939161954732265, "3": 5.713418653820913e-06, "2": 5.4609935602962005e-08, "1": 0}, "score": 4.977049246976379}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5992139895533579, "4": 0.4005544366449519, "3": 0.00023132729240259373, "2": 2.3460419954815e-07, "1": 0}, "score": 4.598982200183492}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999704827216435, "4": 2.945915000081421e-05, "3": 2.0893410808604203e-08, "1": 0, "2": 0}, "score": 4.999970499062078}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998089942439226, "4": 0.0001909240219299729, "3": 4.263019636144915e-08, "1": 0, "2": 0}, "score": 4.999808990710208}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.998993660000068, "4": 0.0010060364252078428, "3": 2.505560973439074e-07, "1": 0, "2": 0}, "score": 4.998993462409232}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9820957493020579, "4": 0.01790009963410145, "3": 4.205640321135882e-06, "2": 4.284315675432155e-09, "1": 0}, "score": 4.98209147728642}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9763653164112256, "4": 0.02362870482281595, "3": 5.965271428077137e-06, "2": 3.0269994155070257e-09, "1": 0}, "score": 4.9763593553058705}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992381872268098, "4": 0.0007615739342954481, "3": 1.528316267933288e-07, "1": 0, "2": 0}, "score": 4.9992381203369245}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9944967526526274, "4": 0.005502916800246502, "3": 3.494571103396197e-07, "1": 0, "2": 0}, "score": 4.994496384389606}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7358080911304608, "5": 0.26317238638119483, "3": 0.0010180945367384876, "2": 1.3051455380472964e-06, "1": 1.9800572213337466e-08}, "score": 4.262151649154725}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9888672468949687, "4": 0.011130936224795935, "3": 1.7150265438544387e-06, "2": 4.494793994478366e-09, "1": 0}, "score": 4.988865619153704}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.621637241127225, "5": 0.3774766751062559, "3": 0.0008851409146837889, "2": 9.268361870454205e-07, "1": 2.4647163846854648e-08}, "score": 4.376589603327166}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998421234138201, "4": 0.0001577845599548046, "3": 3.24837783470348e-08, "1": 0, "2": 0}, "score": 4.99984215046309}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997989830966056, "4": 0.00020084501841116087, "3": 5.550193233240623e-08, "1": 0, "2": 0}, "score": 4.9997990439543365}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5636341940617586, "5": 0.435745492007428, "3": 0.0006198523831295523, "2": 4.899034529752606e-07, "1": 0}, "score": 4.435124647479098}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8337593978764483, "5": 0.16428878755477064, "3": 0.001944077708956039, "2": 7.4238111542562e-06, "1": 1.4697828237907506e-07}, "score": 4.162329448246773}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.82086043326813, "5": 0.17764611954728912, "3": 0.0014922558659202065, "2": 1.0663638156164579e-06, "1": 0}, "score": 4.176151752964752}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9561437462957073, "4": 0.04384804697168309, "3": 8.085598837177264e-06, "2": 1.9406262765681093e-08, "1": 0}, "score": 4.95613571914965}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9979382288760699, "4": 0.0020614781602080906, "3": 2.2994331843083592e-07, "1": 0, "2": 0}, "score": 4.997938061823211}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.756918070951182, "4": 0.2429303262513574, "3": 0.00015091376152900448, "2": 5.422677249452681e-07, "1": 3.9471853052309725e-08}, "score": 4.75676603543688}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9710916538021601, "4": 0.02889679181174602, "3": 1.1398947857783365e-05, "2": 2.3568517964957277e-08, "1": 0}, "score": 4.971080335773356}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9225399248811567, "5": 0.0753845750372012, "3": 0.002073725356654562, "2": 1.7227150400878189e-06, "1": 2.8060358111640156e-08}, "score": 4.073307321825072}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998632156758288, "4": 0.00013669300308491106, "3": 1.574216587788802e-08, "1": 0, "2": 0}, "score": 4.99986327550225}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9999756083404814, "4": 2.4271372221530418e-05, "3": 3.650400315085582e-09, "1": 0, "2": 0}, "score": 4.999975721324146}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8291701314442484, "4": 0.17075780012886446, "3": 7.200363169586049e-05, "2": 9.584677637474817e-08, "1": 0}, "score": 4.829097910374195}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9827456805089272, "4": 0.017205974514198846, "3": 4.815931406025714e-05, "2": 1.672192518969341e-07, "1": 0}, "score": 4.982697204880799}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9022330969189347, "3": 0.0834610268830285, "5": 0.014175462528841927, "2": 0.00012990449907188557, "1": 2.8128625080007704e-07}, "score": 3.930453766940452}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979853648072419, "4": 0.0020144070396839924, "3": 2.5056311301285204e-07, "1": 0, "2": 0}, "score": 4.997985091879245}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.997346418288766, "4": 0.0026526461235552015, "3": 8.834121360417329e-07, "1": 0, "2": 0}, "score": 4.997345586913678}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"5": 0.628777953317362, "4": 0.37069289702064545, "3": 0.000528176209404867, "2": 8.382285843273306e-07, "1": 0}, "score": 4.628248185605024}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.8355310652584726, "2": 0.1515162650089976, "4": 0.012896884608476303, "1": 3.9293674745273054e-05, "5": 1.6467315835616588e-05}, "score": 2.8613349635351906}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8552110913927407, "4": 0.14476321085389623, "3": 2.562297879267558e-05, "2": 2.038829245712372e-08, "1": 0}, "score": 4.855185474147718}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999222078259681, "4": 7.77558320055759e-05, "3": 1.3093433394648311e-08, "1": 0, "2": 0}, "score": 4.999922217979319}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6688462740079146, "5": 0.33030120446935146, "3": 0.0008508996980230996, "2": 1.5042945608260264e-06, "1": 0}, "score": 4.329447334902201}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8668716260536833, "3": 0.13024947878595594, "5": 0.002389733561015048, "2": 0.0004884128039292519, "1": 6.757700374940657e-07}, "score": 3.8711613924486006}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9084541465692468, "5": 0.0880303621129704, "3": 0.0035111684681268704, "2": 4.025888202538384e-06, "1": 0}, "score": 4.0845111669649965}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9708914906871917, "3": 0.025643893650888667, "5": 0.0034439035432337188, "2": 2.061416700189864e-05, "1": 2.126236985740777e-08}, "score": 3.977758716065562}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9352972741110605, "4": 0.06468585020014715, "3": 1.6736677320993878e-05, "2": 6.654216700061906e-08, "1": 0}, "score": 4.935280472128531}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9742998056767043, "5": 0.017205343066521297, "3": 0.00843170730660829, "2": 6.278646708430864e-05, "1": 2.9185667331310925e-07}, "score": 4.008647187823208}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9976051013566744, "4": 0.002394117959706199, "3": 7.553497121789806e-07, "2": 5.6492671961289145e-09, "1": 0}, "score": 4.997604354345911}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5479824818347102, "4": 0.45173412104512994, "3": 0.00028312954751297037, "2": 2.9354085736212814e-07, "1": 1.1927096601337213e-08}, "score": 4.547698708668982}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9994427157405882, "4": 0.0005570818950664822, "3": 1.4665924533075764e-07, "1": 0, "2": 0}, "score": 4.999442624755394}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998174524538312, "4": 0.00018239735163033227, "3": 9.244055940607162e-08, "1": 0, "2": 0}, "score": 4.999817417756707}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9912578269736908, "4": 0.008740892306157105, "3": 1.1772027317982953e-06, "2": 3.3256190490585043e-09, "1": 0}, "score": 4.991256742435519}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9866472722783273, "4": 0.013346528038272352, "3": 6.075216083924188e-06, "2": 4.3438486634134496e-08, "1": 0}, "score": 4.986641190131651}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8624552461022349, "5": 0.12232891957682997, "3": 0.015161278023188677, "2": 5.438365004065777e-05, "1": 1.2303893339412723e-07}, "score": 4.107058510447801}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9986493676260157, "4": 0.0013495815466843624, "3": 9.713023860384126e-07, "2": 1.515206516135685e-08, "1": 0}, "score": 4.998648430305344}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995632275928513, "4": 0.0004365130003354269, "3": 2.0623428676823617e-07, "1": 0, "2": 0}, "score": 4.99956307450786}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8139592953031606, "4": 0.1857790898702381, "3": 0.0002607668095515448, "2": 7.048886428601152e-07, "1": 0}, "score": 4.813697235179513}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9159113485962972, "4": 0.08403347900157677, "3": 5.512903663166189e-05, "2": 3.658692137064367e-08, "1": 0}, "score": 4.915856152594021}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9804618596308227, "4": 0.019534602476075864, "3": 3.5700641255325463e-06, "1": 0, "2": 0}, "score": 4.980458258024351}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7455061017764807, "4": 0.25437821094127044, "3": 0.00011562515749658341, "2": 2.9378109933774238e-08, "1": 0}, "score": 4.745390442271798}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974444904881448, "4": 0.0025546158982336802, "3": 8.392031720681361e-07, "1": 0, "2": 0}, "score": 4.997443705556333}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8328519863987739, "4": 0.1670721707065707, "3": 7.5534352892054e-05, "2": 1.1999365146766255e-07, "1": 0}, "score": 4.83277636907699}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9461622433851806, "4": 0.05382190169243607, "3": 1.5699149799098446e-05, "2": 6.890666012193134e-08, "1": 0}, "score": 4.9461464886099495}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8381480780445039, "5": 0.1588687324210769, "3": 0.002974727026478237, "2": 8.136397853765062e-06, "1": 0}, "score": 4.155877783432208}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7563869463110814, "5": 0.24192737528335606, "3": 0.0016845100988059814, "2": 8.771603693524839e-07, "1": 0}, "score": 4.240241180809163}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8975778243601562, "4": 0.10240084648047579, "3": 2.1284211590194264e-05, "2": 4.282293557368954e-08, "1": 0}, "score": 4.897556456409863}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7240468852938582, "5": 0.27528201436681893, "3": 0.000670232024704552, "2": 9.178709807944696e-07, "1": 0}, "score": 4.274609932991484}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8328876165688759, "5": 0.1634407074471207, "3": 0.0036632007202635417, "2": 8.159195373817345e-06, "1": 6.99546963092962e-08}, "score": 4.15976101779139}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9445537332272224, "5": 0.045950777948376646, "3": 0.00944230646262701, "2": 5.247330467860249e-05, "1": 6.980675237263321e-07}, "score": 4.036401431073858}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9508023327869519, "5": 0.036290335965562415, "3": 0.01288573362678484, "2": 2.1532912055958084e-05, "1": 9.184412411040886e-08}, "score": 4.023361260348374}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951273401122259, "4": 0.004870910979185776, "3": 1.77314810642206e-06, "2": 7.330178275448651e-09, "1": 0}, "score": 4.995125520887952}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8270342665935301, "4": 0.1727857139379603, "3": 0.0001793138384334265, "2": 5.78511159553521e-07, "1": 0}, "score": 4.8268539008415505}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9936458746796523, "4": 0.006353434793218481, "3": 6.877537394043885e-07, "2": 3.2861078395202595e-09, "1": 0}, "score": 4.993645179844236}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8604747217472295, "4": 0.13948906052099505, "3": 3.6026167808162504e-05, "2": 1.1859648360752844e-07, "1": 0}, "score": 4.8604385211704875}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993778246913766, "4": 0.0006219986099715622, "3": 1.25823085497098e-07, "1": 0, "2": 0}, "score": 4.9993777497122}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989565394839309, "4": 0.0010431649144273182, "3": 2.0301824197421926e-07, "1": 0, "2": 0}, "score": 4.9989564289524715}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9961379300496185, "4": 0.0038614056645333754, "3": 6.313509173911846e-07, "2": 4.85943335234175e-09, "1": 0}, "score": 4.996137316946885}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8113305213402572, "4": 0.18858595147968446, "3": 8.331682903207898e-05, "2": 1.715884431107446e-07, "1": 0}, "score": 4.811246892780363}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9448923880991519, "3": 0.038274565100425144, "5": 0.01597564825818131, "2": 0.0008515971258079695, "1": 5.580780035682517e-06}, "score": 3.9759811412665984}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9979079609704723, "4": 0.002091543434803053, "3": 4.5737372557529523e-07, "2": 7.569354832587054e-09, "1": 0}, "score": 4.997907519045543}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994302100919588, "4": 0.0005697083470081211, "3": 8.145509093871618e-08, "1": 0, "2": 0}, "score": 4.999430128742749}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9996918756000763, "4": 0.0003080184112473963, "3": 5.170781015570413e-08, "1": 0, "2": 0}, "score": 4.999691878156407}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8565874712894461, "4": 0.14330966507233256, "3": 0.00010222042979758329, "2": 5.149597987547274e-07, "1": 2.5480178519682924e-08}, "score": 4.85648423251907}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9977082089723626, "4": 0.00229040802598878, "3": 1.3617880215203583e-06, "2": 2.4544893706546476e-08, "1": 0}, "score": 4.9977067947709255}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.906467709945734, "4": 0.0934653125771898, "3": 6.660339538238249e-05, "2": 2.732135809045845e-07, "1": 0}, "score": 4.906400651550114}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993744927512759, "4": 0.0006251805937286714, "3": 3.042415130885884e-07, "1": 0, "2": 0}, "score": 4.999374210909219}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9941270336884019, "4": 0.005872277679763146, "3": 7.242754942637668e-07, "2": 4.466239757073484e-09, "1": 0}, "score": 4.994126260606123}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"4": 0.48654565888118073, "3": 0.40469446661532715, "2": 0.09753116607547652, "5": 0.011077004347140054, "1": 0.00015144303656345506}, "score": 3.410865722681017}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9230216948893425, "5": 0.0583244728070612, "3": 0.018187367851022214, "2": 0.0004591612970218375, "1": 7.281919958232638e-06}, "score": 4.039196937434491}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9522121998756741, "4": 0.04776400292845864, "3": 2.353342045702897e-05, "2": 2.1687211259866771e-07, "1": 2.1641501499518996e-08}, "score": 4.952188191840471}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9901384541056494, "4": 0.009846945238193378, "3": 1.4157854493492326e-05, "2": 3.288382001526151e-07, "1": 0}, "score": 4.990123751412687}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8979489956591035, "3": 0.07157077204633196, "5": 0.02924496081427489, "2": 0.0012319783340793472, "1": 3.12055714490514e-06}, "score": 3.9552008626965076}]