[{"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5864404210125074, "4": 0.40995931742486513, "3": 0.003598507869987176, "2": 1.6702353722497668e-06, "1": 4.8889460274776995e-08}, "score": 4.582838446150842}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9121570406830775, "4": 0.08737325936999883, "3": 0.00046897176213405584, "2": 6.52247986461422e-07, "1": 7.01220879868504e-08}, "score": 4.911686559359904}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6231217836028237, "4": 0.3760699934966216, "3": 0.0008079131442186942, "2": 2.509128924699531e-07, "1": 1.4792182576735343e-08}, "score": 4.62231335166996}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9881448126171205, "4": 0.011837634006821432, "3": 1.7405940534190142e-05, "2": 1.0380662952477675e-07, "1": 0}, "score": 4.988127242174225}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9999925349918634, "5": 6.7958121214316315e-06, "3": 5.496874461386165e-07, "2": 5.439666446206099e-08, "1": 0}, "score": 4.000006137331746}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6834514888178076, "5": 0.31005697750145805, "3": 0.00647122728432267, "2": 1.966942811414392e-05, "1": 4.2315554788420857e-07}, "score": 4.303545206796099}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6480937805696035, "5": 0.3490060575686885, "3": 0.002898656283172371, "2": 1.2705737345731006e-06, "1": 5.144801276496293e-08}, "score": 4.346104769323889}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7824953101533801, "5": 0.20527513042916626, "3": 0.01220820515032767, "2": 2.0900635348621255e-05, "1": 2.4078389668010087e-07}, "score": 4.1930244427412955}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7974111349991598, "4": 0.20231165985775046, "3": 0.00027646398462680745, "2": 7.410720373342671e-07, "1": 0}, "score": 4.797133188939352}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.557498648425322, "5": 0.4410311813613666, "3": 0.0014675117492365512, "2": 2.6021930179867877e-06, "1": 5.2777493319410505e-08}, "score": 4.439558308429239}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6802860346939952, "4": 0.3180564488017991, "3": 0.0016561419634042577, "2": 1.1849002075041107e-06, "1": 0}, "score": 4.678627651625526}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8858646635394436, "4": 0.11382797061644202, "3": 0.0003069090832507264, "2": 4.0237111602462335e-07, "1": 0}, "score": 4.885556997879182}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8528703465958206, "4": 0.14668464040946655, "3": 0.0004446885982372266, "2": 3.087771554491841e-07, "1": 3.651049804648841e-08}, "score": 4.852424913103619}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7494222669701424, "4": 0.2501980937207835, "3": 0.0003788758420833229, "2": 7.132827010173748e-07, "1": 6.818044796020678e-08}, "score": 4.7490417465414385}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.638700778201875, "5": 0.3598099153127802, "3": 0.00148336518302554, "2": 5.764564206934604e-06, "1": 1.5320499128214233e-07}, "score": 4.358314569818628}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5627877613390161, "5": 0.4312714813720157, "3": 0.00592708651216911, "2": 1.2408187760393762e-05, "1": 1.0748171541653072e-06}, "score": 4.425316433895333}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7858908844852202, "5": 0.21043156197120866, "3": 0.003673584465403678, "2": 3.807952175762181e-06, "1": 1.37044931189521e-07}, "score": 4.206749955445418}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9274885588948232, "3": 0.06649073927768112, "5": 0.005914379439933489, "2": 0.00010571666651363946, "1": 4.717630453405329e-07}, "score": 3.9392107833968875}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6254977789004631, "4": 0.3720931696572497, "3": 0.002403750627526144, "2": 4.5834342709938755e-06, "1": 5.554717967959415e-07}, "score": 4.623083295871608}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6222310887001327, "5": 0.37256666154710927, "3": 0.005191952750836164, "2": 9.670002402986324e-06, "1": 5.827450810458105e-07}, "score": 4.3673536368132515}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8657910944047132, "5": 0.1320581134328025, "3": 0.002149965464488892, "2": 7.255157904052185e-07, "1": 1.97118866483485e-08}, "score": 4.129906648384609}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5046762875485106, "5": 0.49400393314199936, "3": 0.0013190315313976206, "2": 7.784329317450831e-07, "1": 2.5427311110707285e-08}, "score": 4.492683240832069}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9714018078455587, "4": 0.02851002782741451, "3": 8.799478558126956e-05, "2": 2.9099728287845336e-08, "1": 0}, "score": 4.971313891273512}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6343267872717256, "4": 0.365390512526141, "3": 0.0002823892837856097, "2": 2.1272980449322022e-07, "1": 2.6582014406046205e-08}, "score": 4.634043938183973}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5178291590009698, "4": 0.4806267248327161, "3": 0.0015427395722225105, "2": 1.222570437096921e-06, "1": 6.614503538970557e-08}, "score": 4.516283821223077}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9462890376208183, "5": 0.04089802931915338, "3": 0.012803886773122, "2": 8.782187812321195e-06, "1": 1.3292178027062742e-07}, "score": 4.028076183088024}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.897332792138867, "5": 0.09237792830747264, "3": 0.010280349720807148, "2": 8.54243467538464e-06, "1": 0}, "score": 4.082080525515161}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9491647990206941, "4": 0.05081653933123506, "3": 1.863527999359438e-05, "2": 1.017745354543054e-08, "1": 0}, "score": 4.949146158753061}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9561999902373263, "4": 0.043784101804070885, "3": 1.587638139441901e-05, "2": 4.184807661865694e-08, "1": 0}, "score": 4.956184020338938}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8080944368508534, "5": 0.19068874262014338, "3": 0.0012148973394977493, "2": 1.7822605989807874e-06, "1": 4.130178985603343e-08}, "score": 4.189470175730445}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8345997670003145, "3": 0.0841077722085892, "5": 0.08119495210024881, "2": 9.600977968176058e-05, "1": 1.2279775624828766e-06}, "score": 3.9968914755574048}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.8716020882791152, "2": 0.08619220798533585, "4": 0.04214058451139456, "5": 3.8632989354740025e-05, "1": 2.647199966499588e-05}, "score": 2.9559726978787033}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9768886956943783, "4": 0.0230919109062353, "3": 1.921227807960698e-05, "2": 7.289979572951421e-08, "1": 0}, "score": 4.976869443334994}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9101706223124203, "4": 0.08956526514101185, "3": 0.00026254265339728793, "2": 1.146956093470525e-06, "1": 0}, "score": 4.909906170579892}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.865522489760853, "4": 0.13323262745607245, "3": 0.0012408355445923975, "2": 3.7419787833406594e-06, "1": 2.5747402389727235e-07}, "score": 4.864273439136511}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8050977019871899, "5": 0.1921682478091925, "3": 0.0027296906260448235, "2": 3.99950081852789e-06, "1": 2.2546768320573833e-07}, "score": 4.189429907277445}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7843149793032684, "4": 0.21505544508168561, "3": 0.0006274120852255024, "2": 1.8263374317689248e-06, "1": 2.767553317390924e-07}, "score": 4.783683131640686}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7764905705467253, "4": 0.2218538382949323, "3": 0.0016466367576266454, "2": 7.819085140161949e-06, "1": 9.454886057043464e-07}, "score": 4.774825606235798}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5499531424117352, "4": 0.4471291946794723, "3": 0.0029029088296384452, "2": 1.332420835744908e-05, "1": 1.1363320305013442e-06}, "score": 4.547020336740966}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.837793490712385, "4": 0.16200807488869967, "3": 0.00019726274241406701, "2": 9.83507080357348e-07, "1": 1.5489707079490022e-07}, "score": 4.837593824116561}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7245627206666421, "4": 0.274456472701349, "3": 0.000978075688323652, "2": 2.4898178569064598e-06, "1": 2.605307344965806e-07}, "score": 4.723578869709421}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9633293447020881, "4": 0.036567745412740334, "3": 0.00010249895034242022, "2": 2.8556690272888527e-07, "1": 5.982022634403077e-08}, "score": 4.963226158294522}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9960344401813798, "4": 0.003950409636512272, "3": 1.5135569321157683e-05, "2": 2.9754721847084836e-08, "1": 0}, "score": 4.9960192300209565}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994202100431919, "4": 0.0005787646729823147, "3": 9.977870102446846e-07, "2": 3.787718416692687e-09, "1": 0}, "score": 4.999419228376072}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7665775819047527, "4": 0.23302545091194765, "3": 0.00039529718850264206, "2": 1.605386532755527e-06, "1": 1.014863023285038e-07}, "score": 4.766178741229108}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6442754480230333, "5": 0.35357830667558304, "3": 0.0021437771122849343, "2": 2.345150450800959e-06, "1": 5.3430398107169835e-08}, "score": 4.351429703433609}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8566410182458691, "4": 0.1432202677361971, "3": 0.00013848514422544443, "2": 1.6630024125948923e-07, "1": 1.1955971216260181e-08}, "score": 4.856502207987245}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6476820607676327, "4": 0.35073767486140195, "3": 0.0015757612344616371, "2": 4.295979382504602e-06, "1": 1.0309942737630257e-07}, "score": 4.646097465507537}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9522996550599913, "4": 0.047679726137596544, "3": 2.043300647801771e-05, "2": 6.772238918217413e-08, "1": 0}, "score": 4.952279199047715}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5288222050133324, "5": 0.4693566273622543, "3": 0.0018185179914864532, "2": 2.616141593181934e-06, "1": 1.013530369018044e-07}, "score": 4.467532541300916}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9541698972779488, "4": 0.04574148156031836, "3": 8.816389786542711e-05, "2": 3.6414634624009776e-07, "1": 9.240238933769841e-08}, "score": 4.954080728562517}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9246085871958163, "4": 0.0753072927195976, "3": 8.395841006552854e-05, "2": 1.4021316011850842e-07, "1": 2.4997350442368305e-08}, "score": 4.924524270098272}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8239391902798107, "4": 0.17565511153685157, "3": 0.0004051914040121448, "2": 3.779204927843487e-07, "1": 2.2647463002736932e-08}, "score": 4.823533262561019}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9671423272755377, "4": 0.03280219975957995, "3": 5.512771355065977e-05, "2": 2.236038226234735e-07, "1": 4.4968076951404625e-08}, "score": 4.967086691605769}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9563059459348406, "4": 0.043605586766048365, "3": 8.808238396589234e-05, "2": 3.408339255991011e-07, "1": 3.8563369026557905e-08}, "score": 4.956217071469179}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9245053696548521, "5": 0.04954449124835637, "3": 0.025940832689798823, "2": 9.145066540372685e-06, "1": 6.992350347126218e-08}, "score": 4.0235851608110496}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6187187632561515, "5": 0.37942038247745963, "3": 0.001858090372698914, "2": 2.5939986305499962e-06, "1": 5.8017160469334267e-08}, "score": 4.377556972296298}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6410161483148041, "4": 0.3585761961371471, "3": 0.00040723412182838627, "2": 4.6353172856035067e-07, "1": 2.683749124403927e-08}, "score": 4.640607862451617}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7394206535638717, "5": 0.25928990990957046, "3": 0.0012886669074722358, "2": 6.529710777490187e-07, "1": 1.3738084092680951e-08}, "score": 4.2579999223964435}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9947799085783428, "5": 0.0027145627182121853, "3": 0.00249567860696707, "2": 9.603115316478306e-06, "1": 2.758656127871522e-07}, "score": 4.00019885027803}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9724805156612635, "4": 0.02748887504438752, "3": 3.04396659219441e-05, "2": 8.438594311379848e-08, "1": 0}, "score": 4.972449990117507}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8812608437207643, "4": 0.11802196827762736, "3": 0.0007141328846402702, "2": 2.606044508935871e-06, "1": 3.3484972093289546e-07}, "score": 4.8805405947757015}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9874270315878004, "4": 0.012539740973643382, "3": 3.297703987551759e-05, "2": 9.932932423241141e-08, "1": 2.137345725356843e-08}, "score": 4.987393919829849}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9896976970494522, "4": 0.01025480913015596, "3": 4.717058777337644e-05, "2": 2.565015832089641e-07, "1": 4.818654520416116e-08}, "score": 4.98964988725143}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6940675978337904, "4": 0.3049684348577781, "3": 0.0009616461523142038, "2": 2.236957218804789e-06, "1": 1.2687937563265292e-07}, "score": 4.693101067547029}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5649098602183581, "5": 0.42864087150566377, "3": 0.006425762359915907, "2": 2.289152049585354e-05, "1": 5.98177682023323e-07}, "score": 4.422167538418374}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5267355494956029, "5": 0.46948121114269264, "3": 0.0037797160168134753, "2": 3.4349849969487827e-06, "1": 1.059297180505201e-07}, "score": 4.465694299184564}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5081090444548204, "5": 0.4884238036065954, "3": 0.00346367089504333, "2": 3.263566311309645e-06, "1": 1.3149973507097678e-07}, "score": 4.48495325277479}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6548303267723448, "4": 0.3439279813732413, "3": 0.0012382143221925852, "2": 3.235762352899994e-06, "1": 1.7754637403232685e-07}, "score": 4.653585150261845}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7740007317340711, "4": 0.2254318687133588, "3": 0.0005669703774259417, "2": 3.6831105413623874e-07, "1": 0}, "score": 4.773433071808838}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8411823393205942, "3": 0.14794378625059834, "5": 0.010771049994935082, "2": 0.00010230193195442708, "1": 3.5282558344825273e-07}, "score": 3.8626215780938113}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9349850491829101, "5": 0.059672380728223076, "3": 0.0053328898606277994, "2": 9.42974031381302e-06, "1": 1.3352448068497486e-07}, "score": 4.0543202371670075}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9083541984918608, "5": 0.051468886474935804, "3": 0.04010259233504092, "2": 7.349457235370653e-05, "1": 5.305731497951944e-07}, "score": 4.0112177166136}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8807442855018544, "4": 0.1191121491317582, "3": 0.0001431344728492026, "2": 3.254734322437373e-07, "1": 0}, "score": 4.880600592915148}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8531823495094061, "3": 0.13829925875705643, "5": 0.008316057455329137, "2": 0.00020164577278375192, "1": 4.128943862722097e-07}, "score": 3.869612232533239}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7619822481179449, "5": 0.2362105289013606, "3": 0.0018042638675402484, "2": 2.434069524305938e-06, "1": 7.643646225325085e-08}, "score": 4.2344012727394755}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7769968365398983, "4": 0.22266470589792833, "3": 0.0003381280121538348, "2": 2.27724334204929e-07, "1": 0}, "score": 4.776658332162843}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.897313598395721, "4": 0.10234668052347053, "3": 0.00033923604328742034, "2": 4.1173742859507293e-07, "1": 2.017208740005784e-08}, "score": 4.896973526015729}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9415321394842133, "4": 0.058417007922381664, "3": 5.070824689216331e-05, "2": 1.2307240453587922e-07, "1": 1.4857753303037247e-08}, "score": 4.94148114656013}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8470769147596238, "5": 0.14706519310588928, "3": 0.005840325776795468, "2": 1.698654496389516e-05, "1": 1.4918062751496486e-07}, "score": 4.1411905074984485}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "human", "scores": {"2": 0.5829985556960379, "3": 0.3363502672337203, "4": 0.07175488808806468, "1": 0.006655111985526035, "5": 0.0022405990854761095}, "score": 2.4799270060359317}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6808199829462653, "4": 0.31860008968788445, "3": 0.000578628447812626, "2": 1.16647637334744e-06, "1": 8.777193801304706e-08}, "score": 4.680238788615972}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7984622169335946, "5": 0.19753942387585602, "3": 0.003992358978906959, "2": 5.9094015041948185e-06, "1": 7.39388822898481e-08}, "score": 4.193535027542473}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.908559818650303, "4": 0.0913367091909997, "3": 0.00010297039893699215, "2": 4.276567282360032e-07, "1": 5.913629337011813e-08}, "score": 4.90845582912565}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8011412703392172, "4": 0.19858630250827491, "3": 0.0002715416563426092, "2": 7.868824219563021e-07, "1": 3.6615543532962294e-08}, "score": 4.80086809472378}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8310871383476063, "3": 0.1443689504830604, "5": 0.021335524044006127, "2": 0.003187452724936658, "1": 2.0896309364858866e-05}, "score": 3.8705289742512936}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9353394102023674, "4": 0.06462044708056, "3": 4.0014246690513645e-05, "2": 2.3729591052538853e-08, "1": 0}, "score": 4.9352994464604985}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9993181792155, "4": 0.0006809759283113004, "3": 7.885760391495958e-07, "2": 7.088961365576532e-09, "1": 0}, "score": 4.99931742561915}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.995617372563838, "4": 0.004379419927535582, "3": 3.196292543460604e-06, "2": 2.043842764420711e-08, "1": 0}, "score": 4.995614126212542}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5687713334828739, "5": 0.4306301835565687, "3": 0.0005981003552199272, "2": 3.9206664454966307e-07, "1": 0}, "score": 4.430031294999401}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9550131623795486, "5": 0.03144280178791417, "3": 0.013531404984839726, "2": 1.2487155524446527e-05, "1": 8.523940585506197e-08}, "score": 4.017886167819304}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9266991153628639, "4": 0.07320603617555066, "3": 9.461921349924028e-05, "2": 1.693825619685975e-07, "1": 0}, "score": 4.926604212855887}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8500649165518993, "5": 0.14817062465069725, "3": 0.0017618075146014448, "2": 2.3864980919951116e-06, "1": 0}, "score": 4.146404082905475}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.801752373511327, "5": 0.19683044620569956, "3": 0.0014159777459090983, "2": 1.1127768499248149e-06, "1": 3.5035535168053644e-08}, "score": 4.195412148493353}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5212771921685272, "5": 0.4777782052155047, "3": 0.000943297351508295, "2": 1.177173890684673e-06, "1": 0}, "score": 4.476832614593976}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8486018127930625, "3": 0.10578855935983894, "5": 0.044859957378088997, "2": 0.0007435033398571331, "1": 6.09204948509882e-06}, "score": 3.937566110502564}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5753637669741898, "5": 0.41192005076677507, "3": 0.012606288528058592, "2": 0.00010446275098573988, "1": 5.182867932398632e-06}, "score": 4.399089387151837}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8545150191884284, "4": 0.1448726207840934, "3": 0.0006093483198383701, "2": 2.6442264312126505e-06, "1": 2.6121082423320227e-07}, "score": 4.853899689527503}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9869557118841885, "4": 0.01296212027465287, "3": 8.002583803485847e-05, "2": 1.579541409827209e-06, "1": 4.1693395874665814e-07}, "score": 4.986871419778641}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.873226191421098, "5": 0.11471813032368439, "3": 0.011913969020967271, "2": 0.0001354285991595468, "1": 6.072191379528298e-06}, "score": 4.10251510889889}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5118871798905082, "5": 0.48634147906053865, "3": 0.0017694142842734392, "2": 1.7851984008030173e-06, "1": 1.3625645886675163e-07}, "score": 4.484568088183057}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7067729714504748, "5": 0.24659050318578746, "3": 0.04597293615923312, "2": 0.0006552960760221533, "1": 8.001576285547364e-06}, "score": 4.1992830282470575}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5977420336258589, "4": 0.39942039308597926, "3": 0.0028351980084244176, "2": 2.0942323327982563e-06, "1": 1.2580465376523007e-07}, "score": 4.5949023620930864}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9700399352222179, "4": 0.029941434160068055, "3": 1.8549049687638872e-05, "2": 4.52261670762605e-08, "1": 0}, "score": 4.970021330972575}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9580219930692495, "4": 0.04195388248724296, "3": 2.4006690395147505e-05, "2": 2.178988425160699e-08, "1": 0}, "score": 4.95799803473167}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6329044475310621, "4": 0.36433970174391245, "3": 0.0027478502507817058, "2": 7.609858349468412e-06, "1": 3.950675792381838e-07}, "score": 4.630140189555658}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9035806129172395, "4": 0.09625425490366597, "3": 0.00016462588863182224, "2": 3.709876734845393e-07, "1": 6.585878555267825e-08}, "score": 4.9034151102136665}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8196324671442649, "5": 0.17622538616617742, "3": 0.004138942328467921, "2": 3.149515268449013e-06, "1": 7.206661048419349e-08}, "score": 4.172079925643989}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5284462403700012, "5": 0.4704438961998854, "3": 0.0011088303033954378, "2": 9.807100370727198e-07, "1": 4.1985563665461204e-08}, "score": 4.469332983415393}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8948740650939604, "3": 0.08298832033025208, "5": 0.020589690286364194, "2": 0.0015378692877030125, "1": 9.906232038862859e-06}, "score": 3.934495902939566}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "human", "scores": {"4": 0.49913693601769293, "5": 0.4972383949410199, "3": 0.003614665350978222, "2": 9.58599863137654e-06, "1": 4.280576303836843e-07}, "score": 4.493603268303219}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6752532522207624, "4": 0.32190741687949154, "3": 0.002831068717279051, "2": 7.240784507843093e-06, "1": 9.558794788412089e-07}, "score": 4.672404878350977}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5908158503869769, "5": 0.40783422435532707, "3": 0.0013487257785448573, "2": 1.0852653919567196e-06, "1": 4.872634441695668e-08}, "score": 4.4064832084865}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.679819790435404, "5": 0.31637416480807046, "3": 0.0038006886689449675, "2": 5.0314517359351514e-06, "1": 2.0404556708120504e-07}, "score": 4.312562838790992}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7678799601030816, "4": 0.23170026588605255, "3": 0.00041855439515727953, "2": 9.92945558183387e-07, "1": 9.662773742877702e-08}, "score": 4.767459229735846}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6505018415873467, "5": 0.34561732952771834, "3": 0.003874256521518233, "2": 6.363945572051049e-06, "1": 1.1296644604315337e-07}, "score": 4.341730038834328}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9715706696401795, "3": 0.016485204455795297, "5": 0.011928691862191311, "2": 1.5341576450464247e-05, "1": 6.511557949526266e-08}, "score": 3.9954126087812925}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8095842457007448, "4": 0.18967693426961094, "3": 0.0007379425366597534, "2": 8.180584893720973e-07, "1": 4.879831760446191e-08}, "score": 4.808844529255167}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7567076996748061, "4": 0.24295872646645644, "3": 0.0003330642978453434, "2": 3.686644338556478e-07, "1": 2.4041508011093117e-08}, "score": 4.756373914309605}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9465382500993205, "3": 0.030223119533996274, "5": 0.023212415327995076, "2": 2.5996178799339626e-05, "1": 1.2479630360492532e-07}, "score": 3.992936928383111}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6896512665162214, "5": 0.30546874906169075, "3": 0.0048640006533241156, "2": 1.5569790929286664e-05, "1": 3.4328082259019684e-07}, "score": 4.3005726002336235}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8010269075748719, "5": 0.1844522419922076, "3": 0.014497350070728072, "2": 2.2942487892173217e-05, "1": 3.581514125055389e-07}, "score": 4.169907966425967}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8332978230849036, "5": 0.13328402519189847, "3": 0.03337924431033735, "2": 3.8450225395045936e-05, "1": 2.964903990432568e-07}, "score": 4.0998270070014815}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5493653368768782, "4": 0.4498025546269779, "3": 0.0008310558975233338, "2": 1.0244220070333775e-06, "1": 2.9099931986656297e-08}, "score": 4.548532144329076}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8169357079975745, "5": 0.17199778158732004, "3": 0.011024347974864073, "2": 4.138266436384028e-05, "1": 7.792748727314137e-07}, "score": 4.1608883305397155}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9168018180360623, "4": 0.08291208080627667, "3": 0.00028502005834907474, "2": 9.861986816057077e-07, "1": 6.968142876139071e-08}, "score": 4.916514639649831}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7063858224769761, "5": 0.288741313706601, "3": 0.004865179829992921, "2": 7.212420130155268e-06, "1": 3.4339721451637185e-07}, "score": 4.283860715226872}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6893826720793975, "4": 0.30841395149671125, "3": 0.0022004442658105673, "2": 2.693457159754044e-06, "1": 1.4281467874382378e-07}, "score": 4.687176478346001}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9681288994323813, "4": 0.03182802143511008, "3": 4.283275261566279e-05, "2": 1.315736586926785e-07, "1": 0}, "score": 4.968085914674747}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5932215446549659, "4": 0.40440153342131313, "3": 0.002367153737974305, "2": 9.288067928674343e-06, "1": 3.012543236136672e-07}, "score": 4.590835016696979}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7994243842341988, "5": 0.13349737022833652, "3": 0.06700734759546825, "2": 7.03089820418369e-05, "1": 5.962546476341397e-07}, "score": 4.066347615420856}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9817032526559588, "3": 0.00916806526731374, "5": 0.009109619826773364, "2": 1.8888958744855786e-05, "1": 1.9048678783151207e-07}, "score": 3.9999032051832715}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9674856560269902, "4": 0.032489997702993725, "3": 2.4285550842662183e-05, "2": 3.998269905591159e-08, "1": 7.001019889528657e-09}, "score": 4.967461282796211}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9950280615086218, "4": 0.004969707965782004, "3": 2.1707496266433114e-06, "2": 9.141676900340659e-09, "1": 3.306254034691866e-09}, "score": 4.995025909649503}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.966253342342319, "5": 0.031662261381354806, "3": 0.0020832160530969424, "2": 9.851164297183226e-07, "1": 5.874587453867913e-09}, "score": 4.029577063068569}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.890123688561866, "5": 0.10550858024885891, "3": 0.0043640458702944385, "2": 3.6185650707687414e-06, "1": 6.290922642341526e-08}, "score": 4.101137108909583}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.925051710304811, "5": 0.040330950593209125, "3": 0.03458635634410549, "2": 3.0750386336563105e-05, "1": 1.445955937034009e-07}, "score": 4.00568266018845}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7874652234152523, "4": 0.21158835787625888, "3": 0.000945825941525962, "2": 5.412508430677382e-07, "1": 3.593802175838648e-08}, "score": 4.786518219410434}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9617515073997865, "4": 0.038239181320915, "3": 9.170754462486433e-06, "2": 1.922131533503588e-08, "1": 0}, "score": 4.9617424148654345}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6294322099611971, "5": 0.36768977465334535, "3": 0.002873372074674988, "2": 4.389501020910678e-06, "1": 9.97006141517599e-08}, "score": 4.36480738069494}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9767438944006983, "4": 0.023158045987018084, "3": 9.755277932641475e-05, "2": 4.063288621200772e-07, "1": 1.195907906080008e-07}, "score": 4.976645151550347}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.801666638696826, "3": 0.19030395917179482, "5": 0.005944351726198334, "2": 0.002064301430741497, "1": 2.0470985823955928e-05}, "score": 3.8114503243207847}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.985772152244107, "4": 0.01421743287626029, "3": 1.0371509315272817e-05, "2": 4.08353381207604e-08, "1": 0}, "score": 4.985761701563001}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9980358267179793, "4": 0.0019595880625447957, "3": 4.523108858470298e-06, "2": 2.5545721251892348e-08, "1": 0}, "score": 4.998031289010589}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9063868113127765, "4": 0.09347123846585585, "3": 0.00014143603394716568, "2": 3.771716304166832e-07, "1": 2.7911305922654618e-08}, "score": 4.9062446360770045}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9203040540568104, "5": 0.0698867852382904, "3": 0.009793063010749108, "2": 1.587808819715792e-05, "1": 9.502982949002751e-08}, "score": 4.060061688443911}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.83186174819768, "5": 0.15618833878956656, "3": 0.011932298450849666, "2": 1.7333248886422276e-05, "1": 2.5461556947560096e-07}, "score": 4.144220613844558}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.848831339702544, "5": 0.14886425925075109, "3": 0.0023040963925024575, "2": 3.553569712086602e-07, "1": 9.579303032105976e-09}, "score": 4.146559414571491}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9735254818613753, "4": 0.02644865427616361, "3": 2.557237220469778e-05, "2": 1.4479744531538252e-07, "1": 0}, "score": 4.973499762699696}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5822055004598148, "5": 0.41485995646631046, "3": 0.0029301812435482016, "2": 4.213124601180159e-06, "1": 9.55632982614685e-08}, "score": 4.411921084174152}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8403063426486419, "5": 0.15389111070606457, "3": 0.005800167398708298, "2": 2.2845282730169316e-06, "1": 5.180583755077823e-08}, "score": 4.148086225188044}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9663305877219626, "4": 0.03363762993952901, "3": 3.175018518640203e-05, "2": 8.528571135215584e-09, "1": 0}, "score": 4.966298843308202}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6532827251049779, "4": 0.3454107466904871, "3": 0.0013057815873205082, "2": 7.04208753419172e-07, "1": 0}, "score": 4.65197556274943}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9621935472359263, "4": 0.03777644948566024, "3": 2.9852827469955255e-05, "2": 3.158770103082112e-08, "1": 0}, "score": 4.962163745598957}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.876254215327601, "4": 0.12366920248295944, "3": 7.635569029501268e-05, "2": 1.3160629300652205e-07, "1": 0}, "score": 4.876177679567719}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9266889912303317, "3": 0.06031249999293936, "5": 0.01294287933972755, "2": 5.499765555021825e-05, "1": 4.6996998781215025e-07}, "score": 3.952518966442749}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8083654282624015, "5": 0.1911602495159927, "3": 0.00047394110265107776, "2": 4.172150669576788e-07, "1": 1.480989942069542e-08}, "score": 4.190685419846474}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7604865448075913, "5": 0.23512046010007143, "3": 0.004383641970431331, "2": 9.102522363930802e-06, "1": 1.2643809704161692e-07}, "score": 4.230718262416933}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5264408286256426, "4": 0.47308268312776824, "3": 0.0004753314061734104, "2": 1.0198408217032048e-06, "1": 3.0723192854560044e-08}, "score": 4.525963421265748}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5813867389157076, "5": 0.4181840802602343, "3": 0.0004287974049993061, "2": 2.789392000056521e-07, "1": 9.944024688377344e-09}, "score": 4.417754734637553}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8860336406207076, "5": 0.09751461644086974, "3": 0.016349973539817014, "2": 9.931062436879966e-05, "1": 2.4327530488320127e-06}, "score": 4.08095872549981}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7639192264093096, "5": 0.211272649906508, "3": 0.024622928925726376, "2": 0.0001807673884306096, "1": 4.209115615139971e-06}, "score": 4.186275599512545}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.738409507547125, "5": 0.24679333326952796, "3": 0.01469061829743, "2": 0.0001027264425973152, "1": 3.709088124872242e-06}, "score": 4.23188615925294}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8944318113160233, "4": 0.10539520892790687, "3": 0.00017187364039565598, "2": 9.17239702744233e-07, "1": 1.2025023183747855e-07}, "score": 4.894257803814629}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5514970661869554, "5": 0.44387375170047544, "3": 0.0045974613879930975, "2": 2.996043140659103e-05, "1": 1.6952946456449926e-06}, "score": 4.4392113121138195}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8320228871046821, "5": 0.15079175499537528, "3": 0.017161571669236524, "2": 2.2804104871160913e-05, "1": 6.900443265787632e-07}, "score": 4.133582544000408}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8454371568646548, "4": 0.15407277858328397, "3": 0.0004894276063427085, "2": 5.560692500510849e-07, "1": 8.298997662471259e-08}, "score": 4.84494636636408}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6133289094049136, "4": 0.38382020967786645, "3": 0.0028493482359365444, "2": 1.3577114947987156e-06, "1": 7.796701377694062e-08}, "score": 4.610476671062878}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9791646184458531, "4": 0.020797327211057884, "3": 3.7897326093025026e-05, "2": 1.2804091188424887e-07, "1": 0}, "score": 4.979126493409188}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997097471315166, "4": 0.00028906065875218155, "3": 1.0542467785540096e-06, "1": 1.1620709835453264e-08, "2": 9.249965640218023e-09}, "score": 4.999708756580851}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8112980363165373, "3": 0.10074486975477284, "5": 0.08708303414784153, "2": 0.0008607989399743063, "1": 1.3119944560879236e-05}, "score": 3.9845772045064223}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7751439228243866, "5": 0.2218749819732021, "3": 0.0029752997165504846, "2": 5.60850703228457e-06, "1": 1.4612681446791948e-07}, "score": 4.218888035804161}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5450403774494461, "4": 0.45445076457521133, "3": 0.0005079571318848195, "2": 8.735145940116168e-07, "1": 0}, "score": 4.544530688169778}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6603315642708062, "4": 0.33912924180305953, "3": 0.0005367618736883191, "2": 2.085925325427186e-06, "1": 2.139723576772852e-07}, "score": 4.6597900758237945}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6986691694413901, "4": 0.30090794246447433, "3": 0.0004212630910938175, "2": 1.3094085647340873e-06, "1": 8.679411648572155e-08}, "score": 4.698245186909568}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5451966629281138, "4": 0.4505791606752901, "3": 0.004215778529822023, "2": 7.904668687072103e-06, "1": 2.9690295570667365e-07}, "score": 4.540964290540709}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9364992199875961, "4": 0.06325400710136395, "3": 0.0002448048978424262, "2": 1.528929103469239e-06, "1": 2.1300802412461642e-07}, "score": 4.936250929871405}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8866641005457717, "4": 0.11242822060925839, "3": 0.0009011980618869375, "2": 5.269879821186303e-06, "1": 8.76757845129328e-07}, "score": 4.88575002842002}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6530877689057515, "5": 0.34489298447402045, "3": 0.0020159010748336077, "2": 3.33868680648168e-06, "1": 9.203333394796973e-08}, "score": 4.342870100721697}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9648961760662276, "4": 0.03506913780868848, "3": 3.44862797993762e-05, "2": 9.39295315666212e-08, "1": 0}, "score": 4.964861604121408}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7344560219305891, "4": 0.26460265323722154, "3": 0.0009393964156053124, "2": 1.7795162504613722e-06, "1": 9.196507054303561e-08}, "score": 4.733512832350016}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6378852058252196, "4": 0.36005168082075173, "3": 0.002055705871976979, "2": 6.933436362912938e-06, "1": 4.444003462681428e-07}, "score": 4.635814318728411}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5456615321197927, "4": 0.4511612340192212, "3": 0.00316509249336816, "2": 1.1525668113029762e-05, "1": 5.09624325158586e-07}, "score": 4.54247191696003}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8035214728638889, "4": 0.19594403426305235, "3": 0.0005325440184719863, "2": 1.756028206417904e-06, "1": 1.0500603628633473e-07}, "score": 4.802985172289329}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7802789461197472, "4": 0.2185025268461693, "3": 0.0012042865043259273, "2": 1.2941815206761816e-05, "1": 1.2763003713494504e-06}, "score": 4.779044964545548}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.645647041437989, "5": 0.3502357079078037, "3": 0.004099455987709266, "2": 1.704056295233424e-05, "1": 5.514547778906206e-07}, "score": 4.346100586566714}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5907365682198074, "4": 0.40859072349549874, "3": 0.0006721224612773873, "2": 5.633999895794317e-07, "1": 1.2427712238156705e-08}, "score": 4.590063287573519}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8555699362619336, "5": 0.13653068378292843, "3": 0.007889559309448844, "2": 9.610435679053393e-06, "1": 1.15131486598188e-07}, "score": 4.1286215704368106}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9608411310146482, "4": 0.03914028638898381, "3": 1.8451774744316993e-05, "2": 4.8988120843128754e-08, "1": 0}, "score": 4.960822659891145}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9431914921470376, "4": 0.056774357934617055, "3": 3.4029015507674194e-05, "2": 5.090763116354015e-08, "1": 0}, "score": 4.943157427332767}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5633786044686258, "4": 0.4354531917920012, "3": 0.001167874673989088, "2": 3.1535400618036656e-07, "1": 1.1690444946963477e-08}, "score": 4.562210065151479}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9612725398102524, "4": 0.03870105957973074, "3": 2.6292206328934503e-05, "2": 5.153807407494631e-08, "1": 1.0378203991981779e-08}, "score": 4.961246158079008}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9998743001608869, "4": 0.00012536250220010527, "3": 2.525410568659179e-07, "1": 0, "2": 0}, "score": 4.999874132405014}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9965952045067121, "4": 0.0034031935799315382, "3": 1.5629898507314254e-06, "2": 1.0971454308763612e-08, "1": 0}, "score": 4.99659364743079}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9998490324867421, "4": 0.0001508461673060759, "3": 3.202086869446202e-08, "1": 0, "2": 0}, "score": 4.999849089777476}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5967238353318035, "4": 0.4025240227715743, "3": 0.0007516385508720399, "2": 4.664751906311578e-07, "1": 3.1283970349259326e-08}, "score": 4.595971173308085}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7478836957965571, "4": 0.25151604355644863, "3": 0.0005982711970764337, "2": 1.8892644207864025e-06, "1": 4.62078564632059e-08}, "score": 4.747281547783564}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7288133102224621, "4": 0.27080028107538573, "3": 0.0003855814898041644, "2": 7.722086897052804e-07, "1": 3.9781892121846573e-08}, "score": 4.728426076057533}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9390926460978142, "4": 0.06083251176206628, "3": 7.459314090163934e-05, "2": 1.8329737554785632e-07, "1": 1.4501452791812896e-08}, "score": 4.9390176909358745}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8463166488363927, "4": 0.1535178088680757, "3": 0.00016528785967943462, "2": 2.5295202264901827e-07, "1": 1.4863058467881974e-08}, "score": 4.846150799162647}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8721794456049792, "3": 0.08719761494407821, "5": 0.03975943927637794, "2": 0.0008424805348839251, "1": 2.096986816308225e-05}, "score": 3.9508139512099785}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6716135689948813, "5": 0.32438107399884886, "3": 0.003998666693711586, "2": 6.193327841376938e-06, "1": 4.537724391127532e-07}, "score": 4.320368673175998}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5988782841070639, "4": 0.399853079738225, "3": 0.0012671588634326056, "2": 1.2810327108162716e-06, "1": 1.6177732245906897e-07}, "score": 4.597608098452514}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.858337998003494, "5": 0.12465747536155965, "3": 0.016974166641953784, "2": 2.9488417465656366e-05, "1": 8.129282375424388e-07}, "score": 4.107621899411694}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9116292880003043, "5": 0.0832051029085759, "3": 0.005160844758502895, "2": 4.506737764479983e-06, "1": 1.6683191973700617e-07}, "score": 4.078034751261447}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9572201520938776, "3": 0.034516113707491296, "5": 0.008230526442969293, "2": 3.301947562913875e-05, "1": 2.3250874493562336e-07}, "score": 3.973647677423514}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9289636435237745, "5": 0.05790705811610824, "3": 0.013114549712904381, "2": 1.4341014200711892e-05, "1": 2.3614897053094577e-07}, "score": 4.044763125604054}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9131723398890667, "4": 0.08643264836101061, "3": 0.0003941321495313843, "2": 7.018079821763364e-07, "1": 7.923054050646819e-08}, "score": 4.912776656396923}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983321581965542, "4": 0.0016664894347842541, "3": 1.2951889061193957e-06, "1": 0, "2": 0}, "score": 4.998330920091966}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7030173834164654, "4": 0.29628228901984305, "3": 0.0006992505075733161, "2": 9.643370177093219e-07, "1": 8.585019312862835e-08}, "score": 4.70231596555474}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7986167423078139, "4": 0.2003803637202915, "3": 0.0009999855790861192, "2": 2.4708187117472795e-06, "1": 3.539964330476438e-07}, "score": 4.797610819764454}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6444824418697385, "4": 0.3539159582879015, "3": 0.0015983842559494036, "2": 2.852582025416362e-06, "1": 1.4244099402625503e-07}, "score": 4.642878066922123}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5635475870497774, "4": 0.43388151025652344, "3": 0.002565154931600787, "2": 5.300462378420905e-06, "1": 3.6542491857274165e-07}, "score": 4.5609707808480335}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9833346867120396, "4": 0.016639598042177142, "3": 2.5456358585130842e-05, "2": 2.4913796938983136e-07, "1": 5.540777001773519e-08}, "score": 4.983308520957773}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5434722128710948, "4": 0.45388800336353874, "3": 0.002635406076852325, "2": 3.9691086892324965e-06, "1": 2.9980337315209454e-07}, "score": 4.540828027996099}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6372407317287379, "5": 0.35911342260091267, "3": 0.0036385319104294276, "2": 6.882820731488776e-06, "1": 4.5964058032205547e-07}, "score": 4.35545973592509}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.980828829862934, "4": 0.01914804801274869, "3": 2.3037505413083577e-05, "2": 1.0987274549153045e-07, "1": 3.767485278273296e-08}, "score": 4.9808053978666695}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9370631903595129, "4": 0.0626767821850634, "3": 0.00025952824950301365, "2": 3.839590233801971e-07, "1": 6.854070737071673e-08}, "score": 4.9368027323243275}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9481020043407205, "4": 0.05185109634388793, "3": 4.6743796790817885e-05, "2": 1.0316398782315174e-07, "1": 2.0090736475120956e-08}, "score": 4.9480550245316754}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7612053235165958, "4": 0.2383094356460945, "3": 0.00048410753314772834, "2": 9.269937625907607e-07, "1": 1.842251842791343e-07}, "score": 4.760718826121009}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8196100259145362, "4": 0.17931923963010127, "3": 0.0010698996713478617, "2": 7.711707671769969e-07, "1": 4.833402852604023e-08}, "score": 4.818538451406196}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5989470991752578, "5": 0.39405676754471897, "3": 0.006978887910812107, "2": 1.659762408923438e-05, "1": 5.021067954200621e-07}, "score": 4.387043234433671}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.599889204490558, "4": 0.39831568886584545, "3": 0.0017939650448704312, "2": 8.800897025088473e-07, "1": 1.4623213677554892e-07}, "score": 4.598093109516184}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5960551158106983, "5": 0.4028113664262465, "3": 0.0011311897771904005, "2": 2.3028708908196976e-06, "1": 2.0440042343770787e-08}, "score": 4.401675511464952}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7467165328232827, "4": 0.25280167270967896, "3": 0.00048104569132997096, "2": 6.719714382034248e-07, "1": 5.186477428725885e-08}, "score": 4.746234006205453}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6986793561121412, "4": 0.2999628036039245, "3": 0.0013535515001793306, "2": 4.04373414326289e-06, "1": 1.6579031660864263e-07}, "score": 4.697317275041601}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5567138140097705, "5": 0.4390164215002866, "3": 0.00426453129389051, "2": 5.176942121693967e-06, "1": 1.1995046152778974e-07}, "score": 4.434741148779265}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8923355589313511, "5": 0.10307982406299716, "3": 0.0045816458019555415, "2": 2.8247406581634152e-06, "1": 8.39773262613205e-08}, "score": 4.098492283002106}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972716081451017, "4": 0.002726130703132754, "3": 2.2619529062617643e-06, "2": 1.2562369992957114e-08, "1": 0}, "score": 4.997269307740436}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9395045040946323, "3": 0.0556465721357286, "5": 0.0037244130873780004, "2": 0.0011173080651596984, "1": 6.919334247303202e-06}, "score": 3.945822451471017}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9202343988790922, "5": 0.07071779785964918, "3": 0.00903874447258111, "2": 8.639256777249674e-06, "1": 2.7971796759284106e-07}, "score": 4.0616609443406695}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9484612191006345, "5": 0.043575448283432364, "3": 0.007861679645613118, "2": 9.687587868840268e-05, "1": 4.33576280052176e-06}, "score": 4.035507025262315}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8679308789835971, "4": 0.1311339577517954, "3": 0.0009321352833532299, "2": 2.682120084155289e-06, "1": 2.2660690876599569e-07}, "score": 4.866992803031935}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.969389394406008, "4": 0.030551973391019775, "3": 5.8320610628985646e-05, "2": 1.4582245746219148e-07, "1": 3.1674211642475325e-08}, "score": 4.969330817110899}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.928057218713755, "4": 0.07185431590456212, "3": 8.819070376466843e-05, "2": 1.9428085861630888e-07, "1": 0}, "score": 4.927968714054228}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5016129613426322, "4": 0.49583518290938705, "3": 0.0025502063538690423, "2": 1.5760150769211687e-06, "1": 3.8690567518135305e-08}, "score": 4.499059504198516}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9749700747689328, "4": 0.024943956763772045, "3": 8.573280644094116e-05, "2": 1.367445842116059e-07, "1": 1.7387835228960494e-08}, "score": 4.974884095790593}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5935728298455872, "4": 0.4021926002491219, "3": 0.004232192917688405, "2": 2.338449394894186e-06, "1": 2.8857410900859876e-08}, "score": 4.5893358791621175}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9483057524929229, "4": 0.051653542454937126, "3": 4.056739065177847e-05, "2": 4.6522628886724984e-08, "1": 6.530449891084359e-09}, "score": 4.94826515269687}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9658011256817913, "4": 0.03414523616706812, "3": 5.358126953140574e-05, "2": 4.028184362137901e-08, "1": 0}, "score": 4.965747479879754}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8520885207124278, "3": 0.1404207508829375, "5": 0.00741261870960514, "2": 7.788509176304766e-05, "1": 1.9026395348559767e-07}, "score": 3.866835522278505}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.864692479750423, "3": 0.12867466974874286, "5": 0.003924106880538438, "2": 0.002690317668396592, "1": 1.8203275637383108e-05}, "score": 3.8698141629787948}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.969626823062618, "4": 0.030333092522002256, "3": 3.990026869023613e-05, "2": 3.791852719910197e-08, "1": 1.1172024454009567e-08}, "score": 4.969586944389469}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8253478294880043, "4": 0.17442371434541942, "3": 0.0002280278015091126, "2": 3.221166789660618e-07, "1": 1.7172921930769545e-08}, "score": 4.825119179432246}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9443861493146928, "4": 0.055515234522275414, "3": 9.830575374712049e-05, "2": 1.9739875834744858e-07, "1": 1.8968995621989903e-08}, "score": 4.944287480658683}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5824157495317916, "5": 0.41510478360805997, "3": 0.0024752051438310173, "2": 4.057822736474892e-06, "1": 2.0571687637940068e-07}, "score": 4.412620844915797}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.944493333780846, "4": 0.05523328601041286, "3": 0.0002702986767987489, "2": 2.338366381414163e-06, "1": 7.015680048848881e-07}, "score": 4.944216292944359}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9856258695826609, "4": 0.014256325158172642, "3": 0.00011735594224599423, "2": 3.243234554024067e-07, "1": 4.3728621281373316e-08}, "score": 4.985507813894778}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9975387931483937, "4": 0.0024541438888479, "3": 6.967486605623339e-06, "2": 4.895496710912321e-08, "1": 2.668297807838232e-08}, "score": 4.99753166749216}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6093671435189427, "4": 0.38879547299306305, "3": 0.0018280352916175955, "2": 8.793594493436132e-06, "1": 4.7120339482400616e-07}, "score": 4.607520158094417}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7948047595186476, "3": 0.18164749693745208, "5": 0.02307970774770921, "2": 0.000464226025695879, "1": 3.720732501715341e-06}, "score": 3.84049258235914}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8262115619397873, "3": 0.16229276230550196, "5": 0.008856881070372585, "2": 0.002618403756823585, "1": 2.017262642596724e-05}, "score": 3.841266758720306}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6104262044313187, "4": 0.375270154644062, "3": 0.014280254501437445, "2": 2.2697335936265025e-05, "1": 4.800934809629689e-07}, "score": 4.59609923955859}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6890064683406439, "4": 0.31051809572475403, "3": 0.0004748602536774869, "2": 5.353463052102101e-07, "1": 3.308340631680943e-08}, "score": 4.688530443136817}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5267756672027153, "5": 0.4699685506629147, "3": 0.0032463629551926997, "2": 8.96929930795404e-06, "1": 2.76798785737225e-07}, "score": 4.466703499490296}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7878803584733822, "4": 0.20993708256271076, "3": 0.002178077874630815, "2": 4.0673413618616e-06, "1": 3.985870174776785e-07}, "score": 4.785692962066785}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9961070664889714, "4": 0.0038830513655669485, "3": 9.784026021359482e-06, "2": 6.389364070492859e-08, "1": 3.3830604011414947e-08}, "score": 4.996097053577509}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7244449380793603, "4": 0.27437104769848863, "3": 0.001182683464440603, "2": 1.2573402258790054e-06, "1": 8.167833889808215e-08}, "score": 4.72325948892471}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8139148380605894, "4": 0.18474353740170354, "3": 0.0013390632187260214, "2": 2.2761833202919955e-06, "1": 1.788262809194724e-07}, "score": 4.8125707723802735}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9956313110059354, "4": 0.00435883830905804, "3": 9.810405008196698e-06, "2": 5.859069156468475e-08, "1": 3.147972969490467e-08}, "score": 4.995621239407953}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7546784156556958, "4": 0.2417799412978278, "3": 0.00353624588150352, "2": 5.033021793793049e-06, "1": 2.9195738123652e-07}, "score": 4.751131282079473}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5952536867608441, "5": 0.3974224334118851, "3": 0.0072715820327738595, "2": 4.932739261922003e-05, "1": 2.7585096664462212e-06}, "score": 4.39004400371216}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8450070825027753, "4": 0.15477707857671277, "3": 0.00021541040261550983, "2": 2.2656351769779446e-07, "1": 0}, "score": 4.844791389582445}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967991375181249, "4": 0.0031929181492907454, "3": 7.849293737207227e-06, "2": 7.723369588105876e-08, "1": 2.8603578630722147e-08}, "score": 4.996791037182483}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8348419779541817, "4": 0.1645030611722511, "3": 0.000652191713596667, "2": 2.508032441675366e-06, "1": 1.832447767493627e-07}, "score": 4.83418428540994}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8352020644948143, "4": 0.16420809229785802, "3": 0.0005884515279951464, "2": 1.161685023956157e-06, "1": 8.784016331097893e-08}, "score": 4.834611144719714}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.94451938704429, "4": 0.05532085039584246, "3": 0.0001587520510936465, "2": 8.320519151958052e-07, "1": 1.2657523025158164e-07}, "score": 4.944358640158539}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8976673442604153, "4": 0.10212917963305304, "3": 0.00020322354051068804, "2": 2.430817573967865e-07, "1": 1.9219585494499717e-08}, "score": 4.8974635681605365}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8451154531596135, "4": 0.15466501412773906, "3": 0.00021913534617039416, "2": 3.614164291795079e-07, "1": 2.8264195782284813e-08}, "score": 4.844895516681739}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9847044663418655, "4": 0.015266286173101275, "3": 2.9020676478833403e-05, "2": 1.3510224159512918e-07, "1": 4.601833191288191e-08}, "score": 4.984675082393724}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6961133170824949, "3": 0.3028145824175487, "5": 0.0007738503881675175, "2": 0.0002975310406803856, "1": 3.0950208752937485e-07}, "score": 3.697363153432318}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6572697278994118, "5": 0.33890183019004044, "3": 0.003823425998708891, "2": 4.723592145695544e-06, "1": 7.998177825731683e-08}, "score": 4.335068788209513}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9272428255351379, "5": 0.06297222013977608, "3": 0.009778061746560486, "2": 6.739909907292133e-06, "1": 0}, "score": 4.053180686692423}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7285670858068957, "5": 0.2670089501453701, "3": 0.004419087730542236, "2": 4.632517968515143e-06, "1": 8.330010727161104e-08}, "score": 4.262580389622489}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.734473840049814, "5": 0.26314849141335944, "3": 0.0023749440492109508, "2": 2.6549094747261538e-06, "1": 4.161342522449443e-08}, "score": 4.2607681199972305}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5624670074758529, "5": 0.4305647327430559, "3": 0.0069440229265155156, "2": 2.2817700168660337e-05, "1": 1.378977879849551e-06}, "score": 4.423570954500173}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8955693927280665, "4": 0.10393102718494719, "3": 0.000497806803992222, "2": 1.5867034434701796e-06, "1": 2.085085060785298e-07}, "score": 4.895067767363766}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7553959954114506, "5": 0.23070244861721492, "3": 0.013881101059449874, "2": 1.9765155377537555e-05, "1": 5.298091444843696e-07}, "score": 4.216780262493009}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9466616337219741, "4": 0.053195833679307206, "3": 0.00014193817251544874, "2": 4.2045011380216717e-07, "1": 3.321271674084837e-08}, "score": 4.946518888246271}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7984924632552338, "4": 0.20088949464337466, "3": 0.0006171178792734524, "2": 8.578908156870337e-07, "1": 7.938026906622872e-08}, "score": 4.797873381042098}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8638726559393388, "5": 0.11851822888315666, "3": 0.017576021862796973, "2": 3.204498054894998e-05, "1": 9.066639161383653e-07}, "score": 4.100875411358556}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9295555353992708, "3": 0.040845402904758465, "5": 0.0285017981703889, "2": 0.001089560908652464, "1": 7.3523321187421725e-06}, "score": 3.985455211357151}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8921530503594722, "3": 0.08152088776315018, "5": 0.02624557698371506, "2": 7.940223829461628e-05, "1": 7.339932533466184e-07}, "score": 3.944563663435665}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9662851731842054, "4": 0.033643173877751, "3": 7.121379559203246e-05, "2": 3.079313402776241e-07, "1": 6.273583634686016e-08}, "score": 4.96621322148014}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5067678144252707, "4": 0.4916664202809223, "3": 0.0015636788450253292, "2": 1.9967394155536434e-06, "1": 8.463110216604287e-08}, "score": 4.505199890773647}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9006748169533888, "3": 0.07310527890434858, "5": 0.026119591867059082, "2": 9.94240024611056e-05, "1": 8.564833148421067e-07}, "score": 3.952812894007793}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6870597487620146, "4": 0.31145204538668975, "3": 0.0014858667603459524, "2": 2.2514795051498525e-06, "1": 7.088577912802756e-08}, "score": 4.685569177851922}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5729495909766871, "5": 0.4247774050872402, "3": 0.0022708194986887343, "2": 2.060594550617481e-06, "1": 1.1677299505565031e-07}, "score": 4.422502117067487}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9548267390876786, "4": 0.045129131939262386, "3": 4.406238884771579e-05, "2": 5.16700772284847e-08, "1": 7.658191329029698e-09}, "score": 4.954782557311951}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.710896904781337, "4": 0.28815896192117196, "3": 0.0009426087129394676, "2": 1.293111795252436e-06, "1": 1.431692986940923e-07}, "score": 4.709951343028069}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9866765198969109, "4": 0.013309269920938659, "3": 1.4040648092464854e-05, "2": 3.127521206377872e-08, "1": 0}, "score": 4.98666255311322}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9840672930718952, "4": 0.015911247975765007, "3": 2.1467486999281047e-05, "2": 1.3958740021850002e-08, "1": 0}, "score": 4.98404577553288}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9837028689292545, "4": 0.01627005951172071, "3": 2.7041171040945192e-05, "2": 3.373499874731898e-08, "1": 0}, "score": 4.983675756995839}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969294448268614, "4": 0.003066944162246315, "3": 3.6213886525776867e-06, "2": 2.870544531350028e-08, "1": 0}, "score": 4.996925727064266}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989605845668361, "4": 0.0010380340409776715, "3": 1.3715473540065268e-06, "2": 1.4099507066444908e-08, "1": 0}, "score": 4.998959180570222}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8189954014336166, "5": 0.1710938230736707, "3": 0.009893081544783997, "2": 1.7247195627880448e-05, "1": 4.448961290017418e-07}, "score": 4.161164912748394}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9802751023768617, "4": 0.019717657990889998, "3": 7.184353655216688e-06, "2": 2.6383658886877122e-08, "1": 0}, "score": 4.980267893580666}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8299704178261238, "4": 0.16988804800710666, "3": 0.0001415367722619204, "2": 5.058367202402321e-08, "1": 0}, "score": 4.82982873574862}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9752073050702218, "4": 0.024790637927667426, "3": 1.972489711913367e-06, "2": 4.056448499381917e-09, "1": 0}, "score": 4.975205402928691}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8292166906542666, "4": 0.17060167938179546, "3": 0.00018092065372930102, "2": 6.402968115839241e-07, "1": 3.2410998884882294e-08}, "score": 4.829034422518566}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9635995820303237, "5": 0.023043646210764785, "3": 0.013337248755266446, "2": 1.9252319711443342e-05, "1": 2.420230179057217e-07}, "score": 4.009667167024092}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6399779732612418, "5": 0.3562666185235948, "3": 0.003751698905970655, "2": 3.5829717647865945e-06, "1": 6.92724885633476e-08}, "score": 4.352507565972452}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.725693427145738, "4": 0.2734790663235198, "3": 0.000826886099296216, "2": 5.421419334254611e-07, "1": 9.151453727154039e-08}, "score": 4.724865172632604}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8439406050719377, "4": 0.15591214553805982, "3": 0.0001470229295524022, "2": 1.9794235203164274e-07, "1": 2.0678258554818807e-08}, "score": 4.84379313083811}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5790548347123144, "5": 0.418679595553412, "3": 0.0022634175899285173, "2": 1.9869157418485824e-06, "1": 6.634569244359286e-08}, "score": 4.416412046270958}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6595295705488541, "5": 0.33821185158712513, "3": 0.0022551675663175187, "2": 3.247195036404411e-06, "1": 1.450061038347145e-07}, "score": 4.3359497606919595}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9741421942552315, "4": 0.025840661514217662, "3": 1.6977646345975582e-05, "2": 6.598779739291591e-08, "1": 1.0254061150781921e-08}, "score": 4.9741251418758585}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5663973983057032, "4": 0.4316656710358176, "3": 0.0019335511357900588, "2": 3.218719333616071e-06, "1": 1.2372085232604277e-07}, "score": 4.564457059500169}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5684693960762705, "5": 0.4309749979317918, "3": 0.0005550659069538582, "2": 5.341228330497746e-07, "1": 1.970217108331445e-08}, "score": 4.430418798758695}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8665290280858569, "4": 0.13332064334289143, "3": 0.00015011160607934242, "2": 1.6477334072536117e-07, "1": 2.7071671172560838e-08}, "score": 4.8663785274816505}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6969176670136311, "5": 0.30189904668262013, "3": 0.0011829452212536076, "2": 2.1019566540614133e-07, "1": 0}, "score": 4.300715720429762}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9818350414189826, "4": 0.018158055273627564, "3": 6.8754944293581066e-06, "2": 9.73471961775788e-09, "1": 0}, "score": 4.981828164204839}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9935336012252806, "4": 0.006466001937724028, "3": 3.3502958352181975e-07, "1": 0, "2": 0}, "score": 4.99353332760342}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9685469599602755, "4": 0.03144607829856371, "3": 6.864639725633799e-06, "1": 0, "2": 0}, "score": 4.968540189367192}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9799219395602282, "4": 0.020060706053179063, "3": 1.7349740646702358e-05, "2": 2.514242949072106e-08, "1": 0}, "score": 4.979904519450125}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "human", "scores": {"3": 0.763142669690226, "2": 0.2273321306992568, "4": 0.009249651535548496, "1": 0.00025761882190548897, "5": 1.7948123300500972e-05}, "score": 2.7814381835633952}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8036220800501699, "5": 0.17773782637249816, "3": 0.01856103477898801, "2": 7.746378663771617e-05, "1": 1.5859420085763088e-06}, "score": 4.159017107636446}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9615110774604118, "4": 0.038438585237224356, "3": 5.0123028739681995e-05, "2": 1.0533606276893742e-07, "1": 1.6756040781835e-08}, "score": 4.96146078212034}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9004230684980893, "4": 0.09942503856580993, "3": 0.00015169995018321289, "2": 1.7378368513700592e-07, "1": 2.269616203730551e-08}, "score": 4.900270949746567}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9157491687953598, "5": 0.049154312236076074, "3": 0.0350319842174934, "2": 6.381252948389537e-05, "1": 7.227850224586231e-07}, "score": 4.013992534596665}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6371750101089896, "4": 0.36121822568688444, "3": 0.0016039927331551148, "2": 2.6721638047392954e-06, "1": 1.5009130920748826e-07}, "score": 4.635565190497663}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7179062424545847, "5": 0.27885041162377605, "3": 0.0032424835987426215, "2": 8.553175786138706e-07, "1": 1.6411557905513034e-08}, "score": 4.275606165562785}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9303837905055587, "5": 0.060426870327267686, "3": 0.009187705935004686, "2": 1.4918352269238473e-06, "1": 0}, "score": 4.05123618796645}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5972527430418954, "4": 0.40063251231288066, "3": 0.0021122184198412593, "2": 2.4776798005380175e-06, "1": 8.11131291920317e-08}, "score": 4.5951353065409695}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7852505030025562, "4": 0.21447581447531514, "3": 0.0002735533202208111, "2": 1.8482562942320955e-07, "1": 0}, "score": 4.78497653636776}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7496508456365812, "5": 0.2400712319223496, "3": 0.010217089699246165, "2": 5.865252099919936e-05, "1": 2.0539690802572704e-06}, "score": 4.229730704277767}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8609116784616734, "5": 0.10650745460406313, "3": 0.03255022818696187, "2": 2.9896803190180618e-05, "1": 6.64753195343456e-07}, "score": 4.073895444255192}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9535880864359352, "4": 0.04632582027526853, "3": 8.542737142774755e-05, "2": 4.6296471280902314e-07, "1": 6.28144936182924e-08}, "score": 4.953501678313574}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9718741443757558, "4": 0.028092973142988288, "3": 3.25162693012268e-05, "2": 1.4138827609068853e-07, "1": 0}, "score": 4.971841563822897}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9359512754525041, "4": 0.06389731099113397, "3": 0.00015080695240073507, "2": 4.278851579141771e-07, "1": 0}, "score": 4.935799779974805}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5861433469212574, "5": 0.41133652660245607, "3": 0.0025167210383004366, "2": 3.101762685015411e-06, "1": 8.89452344387986e-08}, "score": 4.408813422987616}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6928279701018509, "5": 0.29718810217453157, "3": 0.00996574067931295, "2": 1.7848519399243422e-05, "1": 2.383256073879494e-07}, "score": 4.287185978255432}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6637614341387342, "4": 0.3356332275177851, "3": 0.0006050424119462469, "2": 2.425713361833708e-07, "1": 1.4627098016461861e-08}, "score": 4.663155888388905}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9805048361769211, "4": 0.019456849724302647, "3": 3.820099483079046e-05, "2": 8.676695417838451e-08, "1": 2.110845850035394e-08}, "score": 4.980466403449207}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7353036395822125, "5": 0.2453871282990715, "3": 0.019240012193249518, "2": 6.705388554184222e-05, "1": 1.840890750409948e-06}, "score": 4.226007559148658}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5528696884413018, "5": 0.4452952026550819, "3": 0.0018319150204927231, "2": 3.002206619018688e-06, "1": 1.6559844253853774e-07}, "score": 4.443456797990518}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9638111529421465, "4": 0.036163516494422385, "3": 2.518595651340183e-05, "2": 3.601303070340454e-08, "1": 0}, "score": 4.96378599962084}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9139965611070495, "4": 0.08586231964103994, "3": 0.0001407134506967326, "2": 2.001747703969472e-07, "1": 0}, "score": 4.913855635219695}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9962607220764933, "4": 0.003737149215704197, "3": 2.039632323358457e-06, "2": 1.7275474503997626e-08, "1": 0}, "score": 4.996258719424601}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5693302266615953, "5": 0.4295104531082877, "3": 0.001157729638370656, "2": 1.6075906347466864e-06, "1": 5.9075473421470465e-08}, "score": 4.428349298475826}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8357704039837394, "4": 0.16400576489122265, "3": 0.00022323110005492412, "2": 4.7398886835984495e-07, "1": 6.437696204873623e-08}, "score": 4.835546083294125}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9348229312219913, "4": 0.06510522316739559, "3": 7.162094491711064e-05, "2": 1.2017846387394013e-07, "1": 2.1715881016259984e-08}, "score": 4.934751082143113}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7265161618782799, "4": 0.2713798714376444, "3": 0.002100689405067784, "2": 3.024284570721283e-06, "1": 1.6540927165047376e-07}, "score": 4.724408991123737}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9561582501501991, "4": 0.043761068670250564, "3": 8.016825054208616e-05, "2": 4.4329516592647955e-07, "1": 5.6020059779783385e-08}, "score": 4.9560770402649705}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989580875680797, "4": 0.001040973964238214, "3": 9.403666354636647e-07, "2": 6.021755553234197e-09, "1": 0}, "score": 4.998957127245484}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8940158049946152, "4": 0.10588867209899294, "3": 9.531312822225027e-05, "2": 1.4897311254539083e-07, "1": 1.4662127913972173e-08}, "score": 4.893920191181881}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8651456973424511, "4": 0.1346938033452537, "3": 0.00016005612867965932, "2": 3.0911297870402985e-07, "1": 3.7051796420369377e-08}, "score": 4.864984995752266}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9190737275509769, "5": 0.0656331089993225, "3": 0.015284124555898672, "2": 8.859315975462904e-06, "1": 1.4071954076343673e-07}, "score": 4.05033084560862}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9731591080391435, "4": 0.026824798557490058, "3": 1.591577185213512e-05, "2": 7.284674399139895e-08, "1": 2.4826927165450775e-08}, "score": 4.973143049903441}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.913733834003214, "4": 0.08618888964920683, "3": 7.665743178060999e-05, "2": 5.347016014244739e-07, "1": 4.410269258536469e-08}, "score": 4.91365601150827}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6027500373227975, "5": 0.3895634756266374, "3": 0.007668146872735311, "2": 1.73770880186231e-05, "1": 8.681650418328686e-07}, "score": 4.381858006330523}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7714108638631575, "4": 0.22828101203907872, "3": 0.0003076139408502643, "2": 3.9342554468134915e-07, "1": 6.264731585611224e-08}, "score": 4.771102316833609}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8981630024026598, "3": 0.09331666217396802, "5": 0.008256050116077742, "2": 0.00026285079662039125, "1": 1.3277218223156921e-06}, "score": 3.9144096940433117}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7787152754398785, "4": 0.22110782511482158, "3": 0.00017665285895484352, "2": 2.3770106075769527e-07, "1": 0}, "score": 4.778538154096335}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9556361926310962, "5": 0.02443355222662553, "3": 0.019731944663866848, "2": 0.00019487017312029147, "1": 2.966813727664597e-06}, "score": 4.004302968812754}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9505827475291576, "5": 0.029264903900890732, "3": 0.02013706162104342, "2": 1.50130610359876e-05, "1": 1.3449699233178663e-07}, "score": 4.009097413934894}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8777345990753266, "4": 0.12217876742511714, "3": 8.642383950642444e-05, "2": 1.8695722305061108e-07, "1": 2.3830036837294627e-08}, "score": 4.8776477288419695}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9311854380128826, "4": 0.06870790643401488, "3": 0.0001063627645013812, "2": 1.384726505183794e-07, "1": 2.0369401267435186e-08}, "score": 4.9310788619096755}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9915321112610721, "4": 0.008451401444033163, "3": 1.624892183508254e-05, "2": 1.8528011905388483e-07, "1": 3.07254664549535e-08}, "score": 4.991515421780296}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9557251454763461, "4": 0.04424418626507164, "3": 3.059203123736284e-05, "2": 6.423054246810575e-08, "1": 1.3500582557846427e-08}, "score": 4.955694383045121}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.777846208339751, "4": 0.22166966517070402, "3": 0.000483440408947373, "2": 5.904741374393383e-07, "1": 3.102030025017566e-08}, "score": 4.777361544128426}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9196024793305667, "4": 0.08030218884959424, "3": 9.47871221718272e-05, "2": 4.490942770890201e-07, "1": 5.055317926428383e-08}, "score": 4.919506683784272}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7170275106580308, "5": 0.27937950177726595, "3": 0.0035855908743642013, "2": 7.21340108599645e-06, "1": 2.0377772916990008e-07}, "score": 4.275778867117253}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9753763689838716, "4": 0.02460582685665557, "3": 1.764009715055003e-05, "2": 5.455251615863105e-08, "1": 7.927247192219554e-09}, "score": 4.975358695079379}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9333245614290429, "4": 0.06664546344602001, "3": 2.9800869113370423e-05, "2": 4.730404628357523e-08, "1": 0}, "score": 4.933294784435268}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8421913786569069, "5": 0.14282823850384072, "3": 0.014939568229444608, "2": 3.9663031522903865e-05, "1": 1.0665067179419915e-06}, "score": 4.127806155563866}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6800077117958785, "4": 0.31217935517785067, "3": 0.007631930891302402, "2": 0.00017761877818000857, "1": 3.2201423220188044e-06}, "score": 4.672010992603165}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5982996282082096, "4": 0.3986971790459375, "3": 0.0029989141674948835, "2": 3.949948567587262e-06, "1": 1.7849486565106242e-07}, "score": 4.595292368033157}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9870884495744712, "4": 0.012828012791462333, "3": 8.313905421636103e-05, "2": 2.512764775102913e-07, "1": 4.468312157650459e-08}, "score": 4.987004775204613}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9847785651866673, "4": 0.015127575629638162, "3": 9.352881381496308e-05, "2": 2.6120977939199487e-07, "1": 3.225747621341044e-08}, "score": 4.984684453518305}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.758824829041278, "5": 0.22766678233945237, "3": 0.013213684260190154, "2": 0.0002839606175549172, "1": 1.021027491599357e-05}, "score": 4.213854660103724}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7119221097307249, "5": 0.2783166457461061, "3": 0.009697908842127905, "2": 6.103195368749234e-05, "1": 2.109745993395163e-06}, "score": 4.268490395840756}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8437406992223789, "5": 0.1497691305843535, "3": 0.006467711127895703, "2": 2.201124717532779e-05, "1": 3.492974449265199e-07}, "score": 4.1432563631834975}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9514657906179866, "4": 0.04833116926788229, "3": 0.0002016479908994523, "2": 1.137536612302187e-06, "1": 0}, "score": 4.951262109732467}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5237036542325082, "5": 0.47292110568221074, "3": 0.0033336699325143774, "2": 3.309319122212953e-05, "1": 7.749982288162629e-06}, "score": 4.469498340735942}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8584407729644952, "5": 0.13603661520953003, "3": 0.005511070453520945, "2": 1.11533684783641e-05, "1": 2.911893773994282e-07}, "score": 4.130502377085456}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9351941445667962, "5": 0.053157115889727054, "3": 0.011638398873072458, "2": 1.006843777311632e-05, "1": 1.991815732180735e-07}, "score": 4.04149798562786}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5244382443618635, "5": 0.47395678610406067, "3": 0.001603999630338697, "2": 8.167935228800583e-07, "1": 3.8442700614197506e-08}, "score": 4.4723510917219}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9851842790286972, "4": 0.01480309793772371, "3": 1.2539210290271256e-05, "2": 5.179832624891592e-08, "1": 1.490588105785243e-08}, "score": 4.985171608369343}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9293453457597322, "4": 0.0705848180071157, "3": 6.960953520052508e-05, "2": 1.1184252296672514e-07, "1": 0}, "score": 4.929275619271835}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7697927008929965, "3": 0.22139266263944823, "5": 0.008497629812149571, "2": 0.0003156460711764503, "1": 1.2493664189368445e-06}, "score": 3.786469903182742}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9867236471596414, "4": 0.013266715161196036, "3": 9.590601015203349e-06, "2": 2.5541021271593425e-08, "1": 0}, "score": 4.986714026727568}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5919687101330281, "4": 0.4064814193073365, "3": 0.001548316604277291, "2": 1.3627702247255814e-06, "1": 5.815610362694461e-08}, "score": 4.590417572062667}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8640516688987516, "4": 0.1356393437379258, "3": 0.00030813055035717, "2": 7.95058611382659e-07, "1": 2.6374452596516716e-08}, "score": 4.863741899666917}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9330397971565126, "4": 0.06688167939164145, "3": 7.830665225652362e-05, "2": 9.62230406650016e-08, "1": 0}, "score": 4.932961410551441}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "human", "scores": {"1": 2.0863471129385223e-08, "2": 0, "3": 0, "4": 0, "5": 0}, "score": 1.0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7428193943924518, "5": 0.23703248019519757, "3": 0.020077921509485064, "2": 6.762350014807249e-05, "1": 2.448296699211764e-06}, "score": 4.216811995437488}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7154692484605748, "5": 0.2750813794005089, "3": 0.00944202319768213, "2": 7.076415951298851e-06, "1": 1.96364345054351e-07}, "score": 4.265624634508111}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8014319771231182, "4": 0.19767563474041489, "3": 0.0008904817050743065, "2": 1.6041316112251803e-06, "1": 2.6664944000886976e-07}, "score": 4.800537515745936}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9152604036892138, "5": 0.06825103364841714, "3": 0.01642060057179085, "2": 6.670777800981653e-05, "1": 1.2298086128447366e-06}, "score": 4.05169332936146}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8764762249276286, "4": 0.123151546085985, "3": 0.0003717839321464899, "2": 4.118564379079545e-07, "1": 3.288638811149601e-08}, "score": 4.876103518896272}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.990399260717984, "4": 0.009597496459380418, "3": 3.1268764218027115e-06, "2": 6.150791895016287e-09, "1": 0}, "score": 4.990396230280951}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9772211112645435, "4": 0.02276273067471427, "3": 1.6088352419446194e-05, "2": 5.930785960571299e-08, "1": 0}, "score": 4.977204914459789}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9817893036989322, "4": 0.018204024189996282, "3": 6.657373636911529e-06, "2": 1.5332547200076243e-08, "1": 0}, "score": 4.98178261507593}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9891277359757396, "4": 0.010859804135979392, "3": 1.234040154380297e-05, "2": 7.023704208868e-08, "1": 0}, "score": 4.9891153038137395}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8697604935536389, "3": 0.11899711855348832, "5": 0.011168574418092844, "2": 7.293608852114023e-05, "1": 7.040813031693977e-07}, "score": 3.892023452730782}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9233765910995219, "5": 0.06820766707478725, "3": 0.008411663704566242, "2": 3.96106353227383e-06, "1": 4.968568368337519e-08}, "score": 4.059787936214133}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7875215606924958, "5": 0.16148224184198137, "3": 0.050918009336428524, "2": 7.664309818110045e-05, "1": 1.3271576604340996e-06}, "score": 4.110406988890939}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8417675346271781, "5": 0.14641516452473902, "3": 0.01179941411516955, "2": 1.7359719616253008e-05, "1": 3.991717745675201e-07}, "score": 4.1345798506599065}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6669306976759227, "3": 0.32754350271852356, "5": 0.0051225393299438576, "2": 0.00040252755653829143, "1": 5.805627181746572e-07}, "score": 3.676772190629025}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9178355259917927, "3": 0.06724574055353472, "5": 0.014834466324025273, "2": 8.329816815247239e-05, "1": 6.908818582071427e-07}, "score": 3.947420042167143}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6146547935933923, "5": 0.38160127432022267, "3": 0.0037324627817519017, "2": 1.1021308749427585e-05, "1": 3.10389772065546e-07}, "score": 4.37784588974556}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9776155073663475, "4": 0.02234246391038388, "3": 4.188566138438755e-05, "2": 5.469481072142441e-08, "1": 0}, "score": 4.977573598700659}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9973465371724662, "4": 0.002650299570238856, "3": 3.170706893943191e-06, "1": 0, "2": 0}, "score": 4.997343359035764}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9886216971503263, "4": 0.011370772859033694, "3": 7.436702646744711e-06, "2": 1.0831048134076208e-08, "1": 0}, "score": 4.9886143203037}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9410960333823397, "4": 0.05886147953396189, "3": 4.2197186911886985e-05, "2": 1.3376718144749177e-07, "1": 0}, "score": 4.941053715587409}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7139062555573973, "5": 0.2810753489116317, "3": 0.0050153413203192975, "2": 2.938700738417386e-06, "1": 4.411120522647709e-08}, "score": 4.2760540175661195}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9837328644544434, "4": 0.01625721774332762, "3": 9.858239056254673e-06, "2": 1.1386333687759455e-08, "1": 4.390476823175842e-09}, "score": 4.9837230133449415}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9938120964222881, "4": 0.006182824951890433, "3": 4.994206586609638e-06, "2": 1.4895688921316929e-08, "1": 0}, "score": 4.99380714151732}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992324771464658, "4": 0.0007670289598566222, "3": 4.4214940129599706e-07, "1": 0, "2": 0}, "score": 4.999232086701606}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8525099656336047, "5": 0.14325702277236765, "3": 0.004224535352332791, "2": 8.120409289095153e-06, "1": 2.194235404924953e-07}, "score": 4.139015607293796}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9788000366204523, "4": 0.021152647585010603, "3": 4.70324391334528e-05, "2": 2.1347267466209622e-07, "1": 7.136616210746451e-08}, "score": 4.97875236168557}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6792369793612544, "4": 0.3172681067316711, "3": 0.0034888748056828983, "2": 5.6048570823941484e-06, "1": 3.6048625808173825e-07}, "score": 4.675735863223593}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7558628232456857, "4": 0.24398144540561334, "3": 0.00015538121638807904, "2": 2.774561317611717e-07, "1": 0}, "score": 4.755706942038929}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8443906550836413, "4": 0.15536757778166155, "3": 0.00024115419880755068, "2": 4.626069793678104e-07, "1": 5.062015600244637e-08}, "score": 4.844148507979404}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8160663467758057, "4": 0.18297714951049515, "3": 0.0009538440208889437, "2": 2.282251733372322e-06, "1": 2.931603816619579e-07}, "score": 4.815107127468099}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8618646665552426, "4": 0.13787006435753793, "3": 0.00026466306335649133, "2": 6.302211798800641e-07, "1": 5.0420298244592304e-08}, "score": 4.861598527498206}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9340657566182076, "5": 0.058125675130132934, "3": 0.007805848644873685, "2": 2.634737503759134e-06, "1": 4.2223157942994654e-08}, "score": 4.050314432486494}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9972052139064731, "4": 0.0027931075102784696, "3": 1.6992339943632698e-06, "2": 1.2378372999682624e-08, "1": 0}, "score": 4.99720345697898}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7470931371712061, "4": 0.25259991640602136, "3": 0.0003063957472274915, "2": 4.5840535026785517e-07, "1": 2.611774156753919e-08}, "score": 4.746785795661767}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8664071246923908, "5": 0.07717600394476526, "3": 0.05638094681398813, "2": 3.53090589312674e-05, "1": 3.949228135003349e-07}, "score": 4.020723258815344}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8996777502974135, "4": 0.10029430151851296, "3": 2.7958144652699208e-05, "2": 2.6371366966075744e-08, "1": 5.095607208714324e-09}, "score": 4.899649686852921}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9714432030727777, "4": 0.028530610941020707, "3": 2.6048718104917014e-05, "2": 1.733195377680919e-08, "1": 0}, "score": 4.971417236198802}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9211643834445441, "4": 0.07880845428441097, "3": 2.7039034872812723e-05, "2": 5.903283632350472e-08, "1": 4.81877061762934e-09}, "score": 4.9211372665890245}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9501838165493129, "4": 0.04980957720938119, "3": 6.545361023009447e-06, "2": 8.598173843621687e-09, "1": 0}, "score": 4.950177303669216}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8653803307125272, "3": 0.1287149254811086, "5": 0.005761899985914696, "2": 0.00014196145228463015, "1": 8.082325584286994e-07}, "score": 3.876760617766135}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9956802424095063, "4": 0.00431066799343429, "3": 8.789862404765522e-06, "2": 1.2898664049524794e-07, "1": 1.242784778802732e-07}, "score": 4.995670868006751}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9603028284124484, "4": 0.039670319124849085, "3": 2.6746872696463926e-05, "2": 5.4034343597142855e-08, "1": 1.0847816732706419e-08}, "score": 4.960275980018381}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8737521803882803, "4": 0.12620433237839046, "3": 4.33968369869001e-05, "2": 4.6912906849729484e-08, "1": 7.360411466454642e-09}, "score": 4.8737086992052445}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9597536961015225, "4": 0.040232373359217435, "3": 1.3807398310498997e-05, "2": 5.330956851656306e-08, "1": 1.647249198021005e-08}, "score": 4.959739783877248}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5829016110973924, "5": 0.41561116722106567, "3": 0.0014844098397904266, "2": 2.7002154279696153e-06, "1": 5.615332169428167e-08}, "score": 4.4141212114630015}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8738014264489079, "5": 0.12129533768540086, "3": 0.004901044173180283, "2": 2.1294475033253923e-06, "1": 4.486750605823986e-08}, "score": 4.116389902037262}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7715499232037154, "4": 0.2280601657433322, "3": 0.0003897471743330277, "2": 1.8389240606811088e-07, "1": 1.1286167230409298e-08}, "score": 4.7711597502488035}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8644405018484631, "4": 0.13548598171394052, "3": 7.338918327712647e-05, "2": 5.148151632549852e-08, "1": 7.345800849326014e-09}, "score": 4.864367046810797}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.980915762612748, "4": 0.019074757783594437, "3": 9.495970568683597e-06, "2": 2.555021769450802e-08, "1": 5.087791451777035e-09}, "score": 4.980906154170953}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.739045492787287, "4": 0.2580229356870221, "3": 0.0029255376594315083, "2": 5.4512261115270035e-06, "1": 2.904283310622533e-07}, "score": 4.736108396490211}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9000084471316846, "5": 0.07537351693117514, "3": 0.024473514181694203, "2": 0.00014083423464633516, "1": 3.5257160767155466e-06}, "score": 4.0506077653205335}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.997290818773116, "4": 0.0027023851690282756, "3": 6.733705307924098e-06, "2": 4.500010562304807e-08, "1": 2.6247029925643682e-08}, "score": 4.997283907456078}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9993460359277764, "4": 0.0006532906030771907, "3": 5.69599702013066e-07, "2": 4.331776941565751e-09, "1": 0}, "score": 4.999345557137047}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.591806018054284, "4": 0.40115610425873216, "3": 0.0069651439802294705, "2": 6.961552187797573e-05, "1": 2.7997820026793856e-06}, "score": 4.584693429852359}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5116947618414583, "5": 0.48649629159786556, "3": 0.001808271251103603, "2": 6.520869011036267e-07, "1": 3.1470255722170916e-08}, "score": 4.484686617764699}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7072970540593334, "4": 0.29069964285123046, "3": 0.001999940197738479, "2": 3.1956150012633972e-06, "1": 1.5661480776087929e-07}, "score": 4.705290260306895}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9900151652861198, "4": 0.009924227392731359, "3": 6.0220092432392445e-05, "2": 2.1724480187818624e-07, "1": 4.0548501964082946e-08}, "score": 4.989954517193749}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9776714491038003, "4": 0.022265252491173265, "3": 6.30712826858423e-05, "2": 1.4887497160521485e-07, "1": 2.8827097694383398e-08}, "score": 4.977608041903534}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9854557760780116, "4": 0.014531392061020845, "3": 1.2666384037295814e-05, "2": 4.545627327477412e-08, "1": 8.59451180163462e-09}, "score": 4.9854431028020185}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8987624153705114, "5": 0.08518513774294718, "3": 0.01603138364685369, "2": 2.0548204358258116e-05, "1": 3.110127278630325e-07}, "score": 4.069111738749551}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.679469155063245, "5": 0.30960087841897466, "3": 0.010914704087230475, "2": 1.4504726443949695e-05, "1": 6.248595077990699e-07}, "score": 4.29865532997508}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8153299345444354, "5": 0.18347330479992802, "3": 0.0011952881415835523, "2": 1.2511567932508215e-06, "1": 8.578342765351204e-08}, "score": 4.182275281706233}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7941861256735264, "4": 0.2054240499454435, "3": 0.0003885564874050285, "2": 8.856296287324578e-07, "1": 1.7647581419838712e-07}, "score": 4.79379543185314}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5717282030638042, "5": 0.42704969106786306, "3": 0.001219818746154766, "2": 2.096540400647838e-06, "1": 1.4045537700591487e-07}, "score": 4.425825279219864}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8887102629781102, "5": 0.10905202685861301, "3": 0.002235668478748222, "2": 1.8619485706119662e-06, "1": 3.226002465469339e-08}, "score": 4.10681255345493}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8532644466647066, "5": 0.13101492905791917, "3": 0.01523505281289646, "2": 0.00048173017671803553, "1": 3.7252969171774037e-06}, "score": 4.114805253317193}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7372856331022474, "4": 0.26240837644345744, "3": 0.0003056417174525006, "2": 2.519739822008164e-07, "1": 1.5218302828918094e-08}, "score": 4.736979501878589}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9276564625048166, "4": 0.07230244738322084, "3": 4.09449940728891e-05, "2": 1.6546469303904092e-07, "1": 2.0948872722944e-08}, "score": 4.927615085428248}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.846001699933731, "4": 0.1533565004022647, "3": 0.0006400652075524249, "2": 1.495861893279549e-06, "1": 0}, "score": 4.845358844700413}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9797197182593506, "4": 0.020118212090505627, "3": 0.0001613184816567085, "2": 6.173893344320198e-07, "1": 1.233348281394628e-07}, "score": 4.97955680522535}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9810452765656587, "4": 0.018925891003513374, "3": 2.8773204592592617e-05, "2": 5.288310104831355e-08, "1": 0}, "score": 4.981016403817583}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9780354149476792, "4": 0.02186048521505461, "3": 0.00010345374017539834, "2": 5.497391191871491e-07, "1": 5.840875756792386e-08}, "score": 4.977930723614695}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9748379567518232, "4": 0.02514021056899754, "3": 2.1621680928526128e-05, "2": 6.03306240865354e-08, "1": 0}, "score": 4.974816361282914}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8140710677275588, "4": 0.18554535972630815, "3": 0.0003827619509530596, "2": 7.121971982838776e-07, "1": 3.6551120302104266e-08}, "score": 4.813686822052824}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6329278970752432, "5": 0.3639927242024412, "3": 0.0030756522081572075, "2": 3.4352203014801597e-06, "1": 2.186617110080906e-07}, "score": 4.3609095717821855}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5331841059061848, "4": 0.45932144413840814, "3": 0.007484137486610928, "2": 9.787544011034918e-06, "1": 4.116056936966303e-07}, "score": 4.525679218083963}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.865703099869836, "5": 0.12131046415712617, "3": 0.012978094256742137, "2": 7.969458577733268e-06, "1": 1.516990823075708e-07}, "score": 4.108315999776011}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8679688691495789, "4": 0.1318371671607524, "3": 0.00019364867389002095, "2": 2.459833466131709e-07, "1": 0}, "score": 4.8677747884136}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6310580019398481, "4": 0.3665809166118676, "3": 0.0023552744948109783, "2": 5.440617459243795e-06, "1": 2.9995991136579927e-07}, "score": 4.628690988060443}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7989548523550601, "5": 0.19460278459612587, "3": 0.006434854814743436, "2": 7.343345712868249e-06, "1": 8.474356692979387e-08}, "score": 4.188153003938739}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.760285065381994, "5": 0.2328826267952004, "3": 0.006825591329358751, "2": 6.365441274998694e-06, "1": 0}, "score": 4.226044383936664}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5897597077743926, "4": 0.4090011136837044, "3": 0.001238120840540237, "2": 1.0028656561293785e-06, "1": 3.095144966434854e-08}, "score": 4.588519502404543}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7961439561932849, "4": 0.20357632153765134, "3": 0.00027905169683281833, "2": 5.264112950519218e-07, "1": 0}, "score": 4.795863966406356}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8885630425441841, "5": 0.10329449455179464, "3": 0.008069134915742031, "2": 6.933914141714649e-05, "1": 3.5165822209451645e-06}, "score": 4.095076176507672}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6601817058229928, "4": 0.3348689559349718, "2": 0.0036190182195413863, "5": 0.0013264806125303462, "1": 3.804849959063956e-06}, "score": 3.333895300779996}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7701123851842735, "5": 0.22153614942309655, "3": 0.008338396894273126, "2": 1.2440802040780074e-05, "1": 2.7825413115019535e-07}, "score": 4.213172110653677}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8075355177684993, "5": 0.19083291964945182, "3": 0.0016300574815999646, "2": 1.2804781437249267e-06, "1": 0}, "score": 4.189200343710181}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5040654289456309, "5": 0.4947800295149128, "3": 0.001151302924633439, "2": 3.1593318266065125e-06, "1": 9.975945487041448e-08}, "score": 4.493622098540629}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9082924234235064, "4": 0.09164743426634157, "3": 5.997150651233014e-05, "2": 8.651197441899052e-08, "1": 1.4290955247042649e-08}, "score": 4.908232299597086}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6179053923844334, "5": 0.370901481558036, "3": 0.011095703696035025, "2": 9.408734547115793e-05, "1": 3.186332465219353e-06}, "score": 4.359608097641475}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6362180681247679, "4": 0.36021374053782257, "3": 0.0035483378372527363, "2": 1.8543263286861804e-05, "1": 1.3454137115187606e-06}, "score": 4.632628585265931}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7954111485704083, "4": 0.20305211677679155, "3": 0.0015294658839244784, "2": 6.523751265534479e-06, "1": 7.103720429488321e-07}, "score": 4.79386653157178}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8915570236604219, "4": 0.10826029637442211, "3": 0.00018172427357276923, "2": 7.671779919386451e-07, "1": 8.694796505871788e-08}, "score": 4.891373594719887}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6205569734118513, "4": 0.37725073614153715, "3": 0.002185811769956383, "2": 5.986946751984877e-06, "1": 4.999443723567744e-07}, "score": 4.618357682835794}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5823667704268564, "5": 0.41607335505462817, "3": 0.0015569917263268222, "2": 2.823529104317943e-06, "1": 6.22530691003543e-08}, "score": 4.414510528271506}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5757408688393919, "4": 0.42282768373038987, "3": 0.0014301842455041122, "2": 1.0791984157926139e-06, "1": 8.110858698398018e-08}, "score": 4.574308341954823}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8949775686341203, "4": 0.10481158178349931, "3": 0.00021070858349320776, "2": 1.2836873143461817e-07, "1": 1.873776183061714e-08}, "score": 4.894766541634998}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9275291745080896, "4": 0.07242860217061473, "3": 4.205665163951679e-05, "2": 3.99522837964041e-08, "1": 7.477749195013524e-09}, "score": 4.92748712611185}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8047886682033639, "4": 0.19512062927754578, "3": 9.059432362715844e-05, "2": 6.980424586616093e-08, "1": 6.691719302062853e-09}, "score": 4.804697939704608}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6957077543519682, "3": 0.29786265141986323, "5": 0.005470050119368521, "2": 0.000953353871041509, "1": 5.92250533566243e-06}, "score": 3.70568284464317}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8630297635698245, "4": 0.1366616111802657, "3": 0.00030792016904467246, "2": 6.362444449774684e-07, "1": 2.3468564315562217e-08}, "score": 4.862720539645979}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.854904031675118, "5": 0.07580010508417571, "3": 0.06920950986539968, "2": 8.522519089912647e-05, "1": 8.500930694376176e-07}, "score": 4.006417596342448}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.933805291341613, "4": 0.06602900921247015, "3": 0.00016522027076770046, "2": 3.345561864613172e-07, "1": 8.485482345792917e-08}, "score": 4.933639203192145}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8672300215065899, "5": 0.11097747790654328, "3": 0.021781687176320827, "2": 1.0605392073542023e-05, "1": 1.1481324329520924e-07}, "score": 4.089174243817852}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7266912879072058, "5": 0.2715923364517476, "3": 0.0017156796148169104, "2": 6.024127471964095e-07, "1": 4.293965839200742e-08}, "score": 4.269875336868076}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9719851756761372, "4": 0.027982213578216206, "3": 3.247938427178381e-05, "2": 5.0218768782249154e-08, "1": 0}, "score": 4.971952674721101}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5338186310189806, "4": 0.46384805409899466, "3": 0.0023315546550012195, "2": 1.5827748771037242e-06, "1": 5.820171588985884e-08}, "score": 4.531483799588749}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9935030063258773, "4": 0.006495543192155888, "3": 1.4195012222374177e-06, "2": 6.34553132576966e-09, "1": 0}, "score": 4.9935015986087175}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9789010089671911, "4": 0.0210905670015465, "3": 8.340186330972232e-06, "2": 2.6853518009825518e-08, "1": 0}, "score": 4.978892670862301}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9152561202805477, "5": 0.07998151767996528, "3": 0.004757372780413319, "2": 4.848976045228462e-06, "1": 7.613087029483612e-08}, "score": 4.075214223380006}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8301487312232374, "3": 0.1620200963338465, "5": 0.0077106175294762635, "2": 0.00012023631019396708, "1": 3.6814829662237036e-07}, "score": 3.8454489517875916}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6782108168951447, "4": 0.3206783445923454, "3": 0.0011090942364144288, "2": 1.7124867569633834e-06, "1": 6.95038284695521e-08}, "score": 4.677098063637324}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6881739491079019, "4": 0.3111549062415847, "3": 0.0006689405270959888, "2": 2.0185300691188823e-06, "1": 1.5732973673899963e-07}, "score": 4.687500518962705}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.640361723065232, "4": 0.35895968315132015, "3": 0.0006777425919520585, "2": 7.847983744417222e-07, "1": 2.8219714711965688e-08}, "score": 4.6396823506362415}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7934347206592713, "4": 0.20614928256404377, "3": 0.0004153734345748325, "2": 5.618994037279152e-07, "1": 7.012545392785567e-08}, "score": 4.793018006163952}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8131530774595587, "4": 0.18598841354091347, "3": 0.0008564368270612254, "2": 1.883100382184251e-06, "1": 1.5759411525063728e-07}, "score": 4.812292427218703}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9607730155580232, "4": 0.03912407392697625, "3": 0.00010261925215439067, "2": 1.34076540809134e-07, "1": 3.319920191558838e-08}, "score": 4.960670147665891}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9979062992555192, "4": 0.002092501581094945, "3": 1.222724490677167e-06, "2": 4.228333048188391e-09, "1": 0}, "score": 4.997905040343143}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9725475977358398, "4": 0.02743843805331143, "3": 1.3870961552181361e-05, "2": 3.839018534482234e-08, "1": 1.3610054716162125e-08}, "score": 4.972533649279849}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8800519316609665, "5": 0.06589270774301245, "3": 0.05385961714286588, "2": 0.000192296905027469, "1": 3.205972761224498e-06}, "score": 4.0116388816718365}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.67067914549556, "4": 0.3278757347015163, "3": 0.0014415793436204566, "2": 3.381831944099626e-06, "1": 1.7586520781850763e-07}, "score": 4.669230263356337}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6591650635808446, "4": 0.33842231863898625, "3": 0.0024109975402583166, "2": 1.5861973657953945e-06, "1": 3.8867982391603556e-08}, "score": 4.656750773872798}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9736850411593009, "4": 0.026239525451431104, "3": 7.482608528654449e-05, "2": 4.4758427184000916e-07, "1": 8.811632679544045e-08}, "score": 4.973609125270197}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.985108381385163, "4": 0.014840202437425428, "3": 5.10355555755873e-05, "2": 2.7086453822125705e-07, "1": 7.324674697009214e-08}, "score": 4.98505662032523}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6727770043065776, "5": 0.32647500093883314, "3": 0.0007472677524798401, "2": 7.5974650907036e-07, "1": 3.00299085573229e-08}, "score": 4.325726103156378}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9153408860748664, "4": 0.08447836609016397, "3": 0.0001801674250894168, "2": 4.358799393419521e-07, "1": 1.450503374416661e-07}, "score": 4.91515941126264}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9397145829351058, "4": 0.06023893951368234, "3": 4.633675811881242e-05, "2": 3.105754695402849e-08, "1": 1.4491942958347888e-08}, "score": 4.939668230083452}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998648843089473, "4": 0.0001347997788589032, "3": 2.387217951646819e-07, "1": 3.6226030316455583e-09, "2": 0}, "score": 4.999864708277186}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9797496991211689, "4": 0.020224090219823004, "3": 2.6058657586709674e-05, "2": 7.678803524578356e-08, "1": 3.261818115147072e-08}, "score": 4.979723430764489}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9365813030587647, "4": 0.06305850075782332, "3": 0.00035763880694969713, "2": 1.9513365693544124e-06, "1": 6.022025418306079e-07}, "score": 4.936217958563646}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6761075621433806, "4": 0.32314572387263757, "3": 0.0007432690245344449, "2": 2.9589413666531345e-06, "1": 3.2379313412138475e-07}, "score": 4.6753575134165475}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6978212484936286, "4": 0.2982010963794925, "3": 0.003970469219330291, "2": 6.75553762855323e-06, "1": 3.281788837302516e-07}, "score": 4.693836354566246}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9563783343404195, "4": 0.04351657843693677, "3": 0.00010390775744894105, "2": 8.813486903857771e-07, "1": 2.3644386842417845e-07}, "score": 4.9562720135298}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9434863968787915, "5": 0.02999499933642304, "3": 0.02646301979532105, "2": 5.474642435416992e-05, "1": 6.910642750956789e-07}, "score": 4.0034204140006615}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5258072070250782, "4": 0.4630489300620972, "3": 0.011051570880401528, "2": 8.654803328975046e-05, "1": 5.314774362685093e-06}, "score": 4.5145668166198325}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8996269019479546, "3": 0.05314010833399638, "5": 0.0469708209931387, "2": 0.0002580397281034554, "1": 3.827736200072087e-06}, "score": 3.9933031479768375}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9225302797766619, "4": 0.07689082656717924, "3": 0.0005774977567450647, "2": 9.476998488136797e-07, "1": 1.4901408578490306e-07}, "score": 4.921950715412227}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5012700255186414, "4": 0.49264369225503796, "3": 0.006076373042905784, "2": 9.53934245435066e-06, "1": 2.4562152549263343e-07}, "score": 4.495173898436472}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6434130252354597, "5": 0.3549037688201168, "3": 0.0016802703094963745, "2": 2.659586229738859e-06, "1": 8.49320764920751e-08}, "score": 4.35321799204776}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6434000412916189, "4": 0.3413280980201538, "2": 0.010530312248995253, "5": 0.004717169223901027, "1": 2.429300765133243e-05}, "score": 3.3401835675300946}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8108071548585687, "5": 0.11314581430844949, "3": 0.07491187921750486, "2": 0.0011110575160974225, "1": 2.39235554670697e-05}, "score": 4.0359400555217055}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5443055048287377, "4": 0.45340713698417956, "3": 0.002284347165119902, "2": 2.7949844915864307e-06, "1": 1.8990194062235534e-07}, "score": 4.542015012154663}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9299224810673211, "4": 0.07003452109468247, "3": 4.284973916943668e-05, "2": 5.93397758188723e-08, "1": 4.503423282201304e-09}, "score": 4.929879577485917}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8716409451663243, "4": 0.12787590212426767, "3": 0.0004781951716103082, "2": 4.384907618407606e-06, "1": 5.941405080604156e-07}, "score": 4.871152179019182}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6656014573162474, "5": 0.22670973050576612, "3": 0.10405394628995976, "2": 0.0034340567181529243, "1": 0.00020068400528129053}, "score": 4.115185633180819}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6875573257558314, "5": 0.3071300823897932, "3": 0.005300283337220834, "2": 1.1891187243210739e-05, "1": 4.0254336772151605e-07}, "score": 4.301804813510633}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6184584920948967, "5": 0.36694694698542196, "3": 0.014549107899405141, "2": 4.466644541898708e-05, "1": 7.585500915966705e-07}, "score": 4.352306240418203}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8912067551514868, "4": 0.108295410882046, "3": 0.0004956492691573612, "2": 1.9886470993564672e-06, "1": 1.3669891914696972e-07}, "score": 4.89070677135597}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9329531535058968, "4": 0.06687444318541709, "3": 0.00017130310957446174, "2": 9.031492633621199e-07, "1": 1.0816543243475392e-07}, "score": 4.932779802511087}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6816232453194991, "5": 0.3158641066931932, "3": 0.002511794603102703, "2": 8.229042382213743e-07, "1": 4.579311887581494e-08}, "score": 4.313350524103873}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8909823151721021, "4": 0.10836689860846818, "3": 0.0006489105358447091, "2": 1.7100430710814187e-06, "1": 1.5322904635404758e-07}, "score": 4.890329535913272}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7913826052435543, "4": 0.20803428107508104, "3": 0.0005826140486589064, "2": 4.3756218679681046e-07, "1": 1.5550189685051102e-08}, "score": 4.790799106208188}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9785139066836887, "4": 0.021451225550903723, "3": 3.4586677271777103e-05, "2": 2.307696061751595e-07, "1": 5.510446993669358e-08}, "score": 4.9784786884708545}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9938614289884236, "4": 0.006135939959025581, "3": 2.647499363199153e-06, "2": 5.156106997749189e-09, "1": 0}, "score": 4.993858749706596}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8438714891667172, "5": 0.12307889579621586, "3": 0.03296022656586965, "2": 8.771444174695039e-05, "1": 1.58656381971069e-06}, "score": 4.08993848852192}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8843454828413516, "4": 0.11542882185301664, "3": 0.0002247151405203601, "2": 8.644918147997902e-07, "1": 8.635449311063666e-08}, "score": 4.88411880557503}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7672049295926208, "5": 0.22022165876862468, "3": 0.012558142738683772, "2": 1.5024625544749816e-05, "1": 1.4986439276223554e-07}, "score": 4.2076330367883354}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9803321589890621, "4": 0.019628446753173136, "3": 3.921657770215182e-05, "2": 1.62648728736968e-07, "1": 0}, "score": 4.98029263184901}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.992239346089312, "4": 0.00774845817941961, "3": 1.2135299966171961e-05, "2": 6.839090424736977e-08, "1": 1.7967109509126424e-08}, "score": 4.992226994381026}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7773666973358034, "4": 0.22187637978999164, "3": 0.0007534916662590212, "2": 3.1225237153110617e-06, "1": 2.0804488234865115e-07}, "score": 4.77660641464463}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.961033453003629, "4": 0.03890315213082021, "3": 6.268251605556159e-05, "2": 4.752104872560392e-07, "1": 1.3483594765781513e-07}, "score": 4.960969513868878}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8084202696332531, "5": 0.18902240990982866, "3": 0.0025558319292712833, "2": 1.422158172997703e-06, "1": 4.683003810797304e-08}, "score": 4.186463596817491}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6171628262334878, "4": 0.38228674905400767, "3": 0.0005486086018196151, "2": 1.6126963955549258e-06, "1": 1.330853746502788e-07}, "score": 4.616610636348309}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9700048281721834, "5": 0.022210176371993826, "3": 0.007756826380684213, "2": 2.7510989910904403e-05, "1": 3.5994773377312855e-07}, "score": 4.014397252460648}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5732878456344122, "4": 0.4263223622429405, "3": 0.00038932480050325263, "2": 3.5387927961826753e-07, "1": 3.690912597802378e-08}, "score": 4.572897746193978}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7116742971886935, "5": 0.2868412649579423, "3": 0.0014830759550154978, "2": 1.3066264125846105e-06, "1": 8.325247323488509e-08}, "score": 4.285355318008286}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5623922605776007, "4": 0.436204093849823, "3": 0.0014031648311219383, "2": 3.466161032939303e-07, "1": 0}, "score": 4.560988477757049}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9954591713782643, "4": 0.0045358603503068695, "3": 4.974727314558119e-06, "2": 2.2493825221502302e-08, "1": 1.0872175694000377e-08}, "score": 4.995454079405912}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6957388531836414, "4": 0.3040571201487078, "3": 0.0002036289689021192, "2": 3.056653380459997e-07, "1": 0}, "score": 4.695534676896491}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7974256240911157, "5": 0.16057663078201292, "3": 0.04192952694000018, "2": 6.579261236660237e-05, "1": 2.307942783816134e-06}, "score": 4.118508608729299}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.55293529032159, "3": 0.43809916067230076, "5": 0.0068187759684603, "2": 0.002133555803139596, "1": 1.3120377526193636e-05}, "score": 3.5644131003676693}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6556322118042409, "4": 0.3436707506995727, "3": 0.0006961621156278186, "2": 7.695299215638497e-07, "1": 8.588196357725651e-08}, "score": 4.654934266061048}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8827559799220364, "3": 0.11360258700761823, "5": 0.0024360768061824183, "2": 0.0011929351453514648, "1": 1.2180831869819364e-05}, "score": 3.88641104971831}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8707963684421878, "3": 0.10479250781139882, "5": 0.0237164115505683, "2": 0.0006846847805461204, "1": 9.824168842211301e-06}, "score": 3.9175250449088086}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5073003725660724, "5": 0.4912068287831564, "3": 0.0014912672755634552, "2": 1.3400026049644813e-06, "1": 4.9629520941146746e-08}, "score": 4.489712802027222}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.912246919944125, "5": 0.07304133976276116, "3": 0.0146961900362233, "2": 1.5086428396176796e-05, "1": 2.5464714376378124e-07}, "score": 4.058314225126562}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9641226549885846, "3": 0.02160915957023574, "5": 0.014262850345413998, "2": 5.036279212554974e-06, "1": 8.235571366778508e-08}, "score": 3.9926433695571895}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.827261426205159, "4": 0.17251796551857052, "3": 0.00022038776388276117, "2": 1.8832794603520884e-07, "1": 2.3787228926905057e-08}, "score": 4.827040597368533}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9349630585931638, "5": 0.03338165437877899, "3": 0.03163515110124622, "2": 1.9669821506640096e-05, "1": 2.0890045297588587e-07}, "score": 4.00170653737209}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6559699821517725, "3": 0.3038662322223369, "5": 0.03773251837311677, "2": 0.0024108249190143483, "1": 1.9891083340308897e-05}, "score": 3.728984813665496}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8653915893838672, "4": 0.134359464474091, "3": 0.0002483379593925389, "2": 5.121972664885956e-07, "1": 6.454120370304493e-08}, "score": 4.8651420606100135}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9105567257480623, "4": 0.0892896945798818, "3": 0.0001534263362898716, "2": 8.172793269998933e-08, "1": 0}, "score": 4.910403201147908}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8872264948012777, "4": 0.11267413357826248, "3": 9.893673030120502e-05, "2": 3.58741056428271e-07, "1": 0}, "score": 4.887126908142782}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9875266443012205, "4": 0.012450107768555606, "3": 2.311529588600799e-05, "2": 7.45957725181449e-08, "1": 0}, "score": 4.987503437127073}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9229319169355021, "4": 0.07674566317304599, "3": 0.0003194694202483724, "2": 2.276771789736692e-06, "1": 4.769133589392831e-07}, "score": 4.922606644787718}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8263208604340437, "4": 0.17278521286011644, "3": 0.0008914644482782464, "2": 2.2214042877801644e-06, "1": 2.369482675541837e-07}, "score": 4.8254242455556735}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.566480511893436, "4": 0.4327892889600436, "3": 0.0007284877120053226, "2": 1.2508265314538792e-06, "1": 7.231943018302009e-08}, "score": 4.565749525244141}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9689193622949565, "4": 0.03101142481415377, "3": 6.855792840003907e-05, "2": 4.6901738544878626e-07, "1": 7.335259167420156e-08}, "score": 4.968849755359239}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9690063305862174, "4": 0.03094837454408988, "3": 4.488495039113355e-05, "2": 2.1494600067839157e-07, "1": 6.555082768781631e-08}, "score": 4.968960944496664}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "human", "scores": {"5": 0.753587381616223, "4": 0.24466704321769867, "3": 0.0017449297186222766, "2": 6.221230090586621e-07, "1": 1.6565510229645578e-08}, "score": 4.751841163036699}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8777439733309031, "5": 0.11633003480052746, "3": 0.00592180131610382, "2": 4.153660767100345e-06, "1": 2.5593485256882516e-08}, "score": 4.110399850629754}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9846674835060236, "4": 0.015323734163756444, "3": 8.73566925223089e-06, "2": 1.3233041381713419e-08, "1": 0}, "score": 4.984658754285789}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5792632740537369, "5": 0.419877322355907, "3": 0.000857743546506884, "2": 1.5383871431400844e-06, "1": 3.74380601092759e-08}, "score": 4.4190164250099295}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9424764186245311, "4": 0.057495925187173155, "3": 2.751250305696063e-05, "2": 4.8417234591808624e-08, "1": 0}, "score": 4.942448899072231}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7891605448010305, "5": 0.20443232241674242, "3": 0.006395114113086871, "2": 1.1399067547364241e-05, "1": 4.4476623829703915e-07}, "score": 4.198013110489538}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7125436325839708, "5": 0.28404613694030423, "3": 0.003401017933374304, "2": 8.600458862702511e-06, "1": 3.68550165593648e-07}, "score": 4.280626880780703}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8486022455800973, "4": 0.15033072178753487, "3": 0.0010647193879841858, "2": 2.143445450566231e-06, "1": 2.313116272133299e-07}, "score": 4.8475324932323245}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6372342000447125, "5": 0.3595661906973894, "3": 0.0031888306397503162, "2": 1.0070940090803031e-05, "1": 4.77995747948381e-07}, "score": 4.356355866038853}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.753834704355649, "3": 0.24288441675827965, "5": 0.002322843261313365, "2": 0.0009535382675107319, "1": 4.230658090739334e-06}, "score": 3.7575185933241535}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6253890142940689, "3": 0.36603797285228584, "5": 0.008166347765373021, "2": 0.00040537438923686215, "1": 1.174727913689978e-06}, "score": 3.6413140603536616}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8734269342639491, "5": 0.10940209929611326, "3": 0.01715243728026993, "2": 1.8232077778258776e-05, "1": 3.5228265021563315e-07}, "score": 4.092212135922155}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9677548634634391, "4": 0.03215124835403262, "3": 9.357643209902003e-05, "2": 2.5325169521498567e-07, "1": 2.3055280610746625e-08}, "score": 4.967660745659346}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8352842357158553, "4": 0.1639754102335515, "3": 0.0007380647500628147, "2": 2.0171236438568505e-06, "1": 2.351876807634782e-07}, "score": 4.834541462024488}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9039459266786035, "4": 0.09557041245272596, "3": 0.000482316316913939, "2": 1.0561461316603766e-06, "1": 1.8179448339961188e-07}, "score": 4.90346104900499}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9264512426053362, "4": 0.07290808068145549, "3": 0.0006344294924466346, "2": 5.810243950174986e-06, "1": 4.1577108690635314e-07}, "score": 4.925803964944073}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9080642163764827, "3": 0.05840689681345202, "5": 0.03322096255670083, "2": 0.0003041982289950641, "1": 3.481459345243276e-06}, "score": 3.974195218596276}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6685049886598469, "5": 0.32389123953196564, "3": 0.007590073529047363, "2": 1.2961747994711072e-05, "1": 4.695965101488813e-07}, "score": 4.316273918141861}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6707198636624704, "5": 0.32467876527325695, "3": 0.004587362678001979, "2": 1.3219004882663425e-05, "1": 6.386904044852632e-07}, "score": 4.3200630967448985}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8050109412830312, "5": 0.16585333587229625, "3": 0.029063772838501638, "2": 6.908941656944149e-05, "1": 2.7026034737686735e-06}, "score": 4.1366432979779795}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8749061373312177, "5": 0.1023576833830199, "3": 0.022667660904551884, "2": 6.713057195095038e-05, "1": 1.0044986466294457e-06}, "score": 4.079552778332051}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9774624032604013, "4": 0.022515673776603386, "3": 2.185984862474328e-05, "2": 2.1074711971175978e-08, "1": 5.887561098459831e-09}, "score": 4.977440518936195}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7305627875597925, "4": 0.2683666597815352, "3": 0.0010689322777232648, "2": 1.3506751221986593e-06, "1": 1.1263267239096463e-07}, "score": 4.729490930617248}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.914531116530157, "4": 0.08543211457403352, "3": 3.679700875222626e-05, "2": 2.4515653623799778e-08, "1": 0}, "score": 4.914494222361549}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6711702489334995, "4": 0.32851657030528786, "3": 0.00031283145340016937, "2": 2.971113062004934e-07, "1": 1.6931331441119232e-08}, "score": 4.670856796121375}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8636129630281958, "5": 0.12415235477885293, "3": 0.012211957308259908, "2": 2.180500559668013e-05, "1": 6.621153840825597e-07}, "score": 4.111894829955674}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9352619252185953, "4": 0.06468180746084654, "3": 5.608528944797752e-05, "2": 7.82705830455504e-08, "1": 3.060440145295358e-08}, "score": 4.9352056599908}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.847977395326604, "4": 0.15169276296424594, "3": 0.00032955196757279405, "2": 2.411101388923416e-07, "1": 4.516262376676578e-08}, "score": 4.847647228591213}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.98455745207825, "4": 0.015436425040847006, "3": 6.071128839011895e-06, "2": 1.3221612971743664e-08, "1": 8.754070891734687e-09}, "score": 4.984551357560348}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9779068097906458, "4": 0.022057546295829813, "3": 3.5482497898477984e-05, "2": 7.999473635497234e-08, "1": 4.5927030198314866e-08}, "score": 4.977871064230602}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8502101625501783, "5": 0.1037942297367772, "3": 0.04594996003180865, "2": 4.530632094498659e-05, "1": 2.5772569894186017e-07}, "score": 4.057752888716121}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9679721720509871, "4": 0.03199376304572236, "3": 3.384951116234254e-05, "2": 1.0826639787626989e-07, "1": 1.7312223919743964e-08}, "score": 4.967938141004276}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6465263006529122, "4": 0.35321466172542754, "3": 0.0002589312436605031, "2": 1.1762526336747688e-07, "1": 8.226435719217965e-09}, "score": 4.646267096894206}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9966662553080478, "4": 0.0033294571709645408, "3": 4.204679442107118e-06, "2": 3.230780483979786e-08, "1": 1.021864340723047e-08}, "score": 4.996661995537591}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6060577199538351, "4": 0.39314210190994864, "3": 0.0007973504216151042, "2": 2.7701890250583755e-06, "1": 4.677813238275577e-08}, "score": 4.605254695324714}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6023215440133225, "5": 0.3965581461933323, "3": 0.001119278945123022, "2": 9.523292605778315e-07, "1": 4.277123669992305e-08}, "score": 4.395436848411946}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9025332295562607, "4": 0.09740797430211426, "3": 5.86826174615546e-05, "2": 5.4261330998694254e-08, "1": 0}, "score": 4.902474491899332}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5319540316748405, "5": 0.46474201212252275, "3": 0.003301620072223733, "2": 2.173627776251649e-06, "1": 7.784400100632764e-08}, "score": 4.461435850327272}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9823596915690497, "4": 0.017619278625080902, "3": 2.0982181089184263e-05, "2": 8.25187744834023e-08, "1": 0}, "score": 4.982338510072697}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6649056420819097, "5": 0.3331235955686236, "3": 0.0019693199477829634, "2": 1.3999276517497328e-06, "1": 3.5515806004193994e-08}, "score": 4.331151371522345}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8512822813046249, "3": 0.1398545395115578, "5": 0.008664105435313324, "2": 0.00019809219585758617, "1": 8.337101808145923e-07}, "score": 3.8684108609470353}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8534246023645974, "3": 0.1391215037473185, "5": 0.005373713943084858, "2": 0.0020729729382572082, "1": 6.952585174474943e-06}, "score": 3.8620853714752723}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8759516269037139, "4": 0.12384315413855318, "3": 0.0002049261269728039, "2": 2.3728046472681002e-07, "1": 3.451047278459605e-08}, "score": 4.875746141109937}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9087639540855263, "4": 0.09110212946153572, "3": 0.00013365696540195023, "2": 2.002332299645846e-07, "1": 3.383547596916509e-08}, "score": 4.908629818243543}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9959592299704069, "4": 0.004036412405385474, "3": 4.301232278175599e-06, "2": 2.8034890870352096e-08, "1": 1.3842905137579596e-08}, "score": 4.995954845595054}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9465337654117156, "4": 0.053401822734161296, "3": 6.414310212268533e-05, "2": 1.2637590479841888e-07, "1": 1.6244913379053696e-08}, "score": 4.946469440202352}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9771405153454694, "4": 0.022853036090203446, "3": 6.351319318165096e-06, "2": 1.8817133984740915e-08, "1": 0}, "score": 4.977134203026442}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9637939827994003, "4": 0.03602189251293561, "3": 0.00018395102578412157, "2": 1.0282780950836866e-07, "1": 6.641871903569137e-09}, "score": 4.963609868048616}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982482980239393, "4": 0.0017501172382586635, "3": 1.503768901741293e-06, "1": 0, "2": 0}, "score": 4.998246875081988}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8795078230153711, "4": 0.12041176920652062, "3": 8.030537522192673e-05, "2": 7.072052464654196e-08, "1": 0}, "score": 4.8794274040614365}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.856844383259792, "5": 0.13922362857178383, "3": 0.003930502494808877, "2": 1.405811980566285e-06, "1": 2.8625955377379012e-08}, "score": 4.135290235506835}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5170264733906793, "4": 0.482337332384628, "3": 0.0006352080340803201, "2": 9.247818177121113e-07, "1": 4.022697686870911e-08}, "score": 4.5163893060500975}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5867148454874417, "4": 0.4125165924067507, "3": 0.000768118914664383, "2": 3.8600172445174194e-07, "1": 0}, "score": 4.5859459880792395}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5698361019157049, "4": 0.4293234162711712, "3": 0.0008391316087272833, "2": 1.289204753295775e-06, "1": 6.8725673707268e-08}, "score": 4.568994181324384}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8293001472214782, "5": 0.16904005167119762, "3": 0.0016580074979390118, "2": 1.6115550106048239e-06, "1": 5.100664084765021e-08}, "score": 4.167378689977913}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8845089471008933, "4": 0.11486763655394179, "3": 0.0006202989616094899, "2": 2.687865967037246e-06, "1": 2.412242109639557e-07}, "score": 4.883882715163978}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5816435359962349, "4": 0.416775884042413, "3": 0.0015790798105328732, "2": 1.203791980109768e-06, "1": 5.010089323362781e-08}, "score": 4.580062041143949}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8574700822972193, "3": 0.08725923310024516, "5": 0.0551775009650404, "2": 9.271094716221879e-05, "1": 3.371344583385704e-07}, "score": 3.9677318301929554}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8099688247656294, "4": 0.1899031829716991, "3": 0.00012787644930413922, "2": 6.258582638821155e-08, "1": 0}, "score": 4.809840866250511}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9971787828339619, "4": 0.0028197219448797364, "3": 1.5049949729523668e-06, "2": 5.91301490141571e-09, "1": 0}, "score": 4.997177250370409}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8876777020619635, "5": 0.09990765196647121, "3": 0.012411572195471933, "2": 3.0195764039743614e-06, "1": 4.622310757213325e-08}, "score": 4.087489902646738}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9543255598925768, "4": 0.04555920910363261, "3": 0.00011462862534663872, "2": 4.964798194036165e-07, "1": 9.947514728611841e-08}, "score": 4.954209646011494}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8917735913292416, "4": 0.1079988608066633, "3": 0.00022739817549703798, "2": 8.461857768975616e-08, "1": 0}, "score": 4.891546081929511}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7299342626930174, "4": 0.2695058181994197, "3": 0.0005588038728223444, "2": 1.0350405016330196e-06, "1": 6.434799893300403e-08}, "score": 4.729373207253018}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9660844144775415, "4": 0.03387969539300718, "3": 3.5835555035354874e-05, "2": 4.4669003940790434e-08, "1": 1.4430843662499681e-08}, "score": 4.96604844192018}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9956443116462204, "4": 0.004349162418032261, "3": 6.496253057290313e-06, "2": 1.6756627253525566e-08, "1": 0}, "score": 4.995637794749586}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9242224033841204, "5": 0.057046736985873425, "3": 0.018431207339090795, "2": 0.0002960192713048126, "1": 3.440069098525621e-06}, "score": 4.038013178231541}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8620193851484675, "4": 0.13598370725747733, "3": 0.001988927957955111, "2": 7.403349685286568e-06, "1": 4.4945055009432805e-07}, "score": 4.860014411220162}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8559420959899211, "4": 0.143870527274905, "3": 0.00018692669935753466, "2": 2.9434979438839656e-07, "1": 3.5507815846769454e-08}, "score": 4.855754576910578}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9833570529138475, "4": 0.01662610879879248, "3": 1.6743708201850322e-05, "2": 3.471739426298121e-08, "1": 1.2001754374131311e-08}, "score": 4.9833402508282685}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8070521021765946, "5": 0.15760609948362628, "3": 0.03494221786159919, "2": 0.0003915699056422121, "1": 7.923947932581097e-06}, "score": 4.121856980522758}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6554823120813782, "5": 0.3376167846267201, "3": 0.006885051959924523, "2": 1.5176353989360211e-05, "1": 4.671380559248289e-07}, "score": 4.330700047277324}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9184467141500319, "3": 0.05521195903385989, "5": 0.026276812044788028, "2": 6.380812657126322e-05, "1": 4.253225562504326e-07}, "score": 3.970935952613755}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9892896496542181, "4": 0.010699027815570975, "3": 1.1163902229355899e-05, "2": 4.635308446034276e-08, "1": 0}, "score": 4.989278504116963}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8103376875367829, "4": 0.1894302492601045, "3": 0.00023042929241636124, "2": 1.2994570949411989e-06, "1": 1.0520847279600334e-07}, "score": 4.810104529417275}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9190973884895812, "5": 0.07124087059806214, "3": 0.009650235111905566, "2": 1.1272144095043916e-05, "1": 1.3687674330251814e-07}, "score": 4.061567686526233}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7483436136135749, "3": 0.23644167944542452, "2": 0.008551855517398833, "5": 0.0066191322346792585, "1": 4.3571643397060076e-05}, "score": 3.75294299037211}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5174487616753051, "5": 0.478004486763603, "3": 0.004531653477568266, "2": 1.4373360930614636e-05, "1": 5.015201755223501e-07}, "score": 4.4734426876772}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9849367480988489, "4": 0.015061708753485316, "3": 1.5263916601584294e-06, "1": 0, "2": 0}, "score": 4.984935238210769}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8864340002872241, "5": 0.10791757906671255, "3": 0.0056372737950778195, "2": 1.088941871841557e-05, "1": 1.7433815573017699e-07}, "score": 4.102258011916771}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5817163041541414, "5": 0.41533759812367904, "3": 0.0029367786371532487, "2": 8.937032133622351e-06, "1": 3.879571273301935e-07}, "score": 4.412381779116078}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5297181268728012, "5": 0.466506399814994, "3": 0.003767841454441542, "2": 6.6576099778706614e-06, "1": 6.650284601422107e-07}, "score": 4.462723391138231}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5451167647602757, "4": 0.4523454143298169, "3": 0.002535267816461417, "2": 2.2184872794402112e-06, "1": 1.0537514969840154e-07}, "score": 4.542576868219253}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9034939998311167, "4": 0.09638059445150103, "3": 0.00012512391396086564, "2": 1.6562543728468335e-07, "1": 2.226439658599299e-08}, "score": 4.903368562711674}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6658344985492227, "4": 0.33330273096088037, "3": 0.0008617299667577316, "2": 9.352527718215131e-07, "1": 6.768975485609284e-08}, "score": 4.664970719997664}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8740801960865224, "5": 0.11777023661532234, "3": 0.008140201866100004, "2": 8.991256075972714e-06, "1": 1.7580981900224126e-07}, "score": 4.109611546550834}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9987906171935388, "4": 0.0012089476603184932, "3": 3.7728498752267554e-07, "1": 2.09091095979716e-09, "2": 0}, "score": 4.998790289338596}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7862109172445775, "4": 0.21306825896204235, "3": 0.0007188884200336964, "2": 1.4115191813607524e-06, "1": 3.307467037458331e-07}, "score": 4.785488365229734}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9387398577094745, "4": 0.061218833492473035, "3": 4.120573962604258e-05, "2": 6.50746346742563e-08, "1": 0}, "score": 4.9386985574759095}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9084795291326947, "4": 0.0914079156304577, "3": 0.00011215575310588928, "2": 2.197962183684521e-07, "1": 4.0912630802344764e-08}, "score": 4.908366937107783}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9335604516836193, "4": 0.06631266330188976, "3": 0.00012628667966563828, "2": 4.0703771090901276e-07, "1": 6.138397680121346e-08}, "score": 4.93343328804185}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6661275102069923, "4": 0.33192458150928067, "3": 0.0019364110373153657, "2": 1.0389218211558138e-05, "1": 7.70944076296639e-07}, "score": 4.664168231781591}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9240157518768419, "3": 0.04542360387044841, "5": 0.03051417345095241, "2": 4.5996327574460746e-05, "1": 3.000322104161243e-07}, "score": 3.984997674211688}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9239665863067461, "4": 0.07586708889604193, "3": 0.00016505859927372775, "2": 9.592760035281589e-07, "1": 2.0827260799315564e-07}, "score": 4.923799075469797}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6045969749741644, "4": 0.393573359614873, "3": 0.0018204484630094657, "2": 8.696847102488774e-06, "1": 5.101117589696759e-07}, "score": 4.602757608502676}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7263125551990581, "5": 0.2716517673564671, "3": 0.0020335208081331195, "2": 1.962231915868594e-06, "1": 1.247093508878547e-07}, "score": 4.269613966747216}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9795206613967028, "4": 0.02045532580166847, "3": 2.392396217096961e-05, "2": 4.892369487768254e-08, "1": 0}, "score": 4.979496678684499}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8484994012204271, "5": 0.14221993237821262, "3": 0.009266189880703353, "2": 1.388260417231982e-05, "1": 0}, "score": 4.1329260562361405}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9825540343078444, "4": 0.017440887029699936, "3": 5.095086061847285e-06, "2": 2.3851708188916822e-08, "1": 0}, "score": 4.982548851945903}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6028730711605912, "4": 0.39668663201515897, "3": 0.0004393770630459304, "2": 7.791026720134204e-07, "1": 5.342986380586029e-08}, "score": 4.602432028151953}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "human", "scores": {"2": 0.7589851628991803, "3": 0.2062198182980583, "4": 0.023892492278517218, "1": 0.010155579704055851, "5": 0.0007466913084048044}, "score": 2.246089359954983}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.882717245439478, "4": 0.11698001157719033, "3": 0.0003013916428279094, "2": 1.1614910387553722e-06, "1": 1.1249050712200035e-07}, "score": 4.882413261605622}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8001142252052151, "5": 0.19588727749794074, "3": 0.0039924987139165705, "2": 5.90302279569289e-06, "1": 7.323165969425892e-08}, "score": 4.191882757327902}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9872787450071974, "4": 0.012709312328557458, "3": 1.1751954391665895e-05, "2": 8.26870365437518e-08, "1": 3.688392565187173e-08}, "score": 4.98726678726002}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7555700360330129, "4": 0.24394694886819568, "3": 0.00048156208222055696, "2": 1.3233541785558884e-06, "1": 4.813915296448605e-08}, "score": 4.755085744382012}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.648459259413599, "4": 0.34966140745868235, "3": 0.0018699596984105397, "2": 9.110645436231075e-06, "1": 2.492159617794227e-07}, "score": 4.646570339549039}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9604381753477953, "4": 0.0395332851456538, "3": 2.835667799925736e-05, "2": 4.4731986928437845e-08, "1": 8.16426608541442e-09}, "score": 4.960409829501281}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7647617129633196, "4": 0.23498509320973718, "3": 0.0002528856873495462, "2": 2.4290728733722203e-07, "1": 2.1412927682475394e-08}, "score": 4.764508310722891}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9561159563815801, "4": 0.04386475626049669, "3": 1.925778814672246e-05, "2": 2.378318544169353e-08, "1": 0}, "score": 4.956096656559604}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9815673580094115, "4": 0.01841662296861659, "3": 1.6017719175891375e-05, "2": 3.071281017014774e-08, "1": 0}, "score": 4.981551249997179}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6710160652813323, "4": 0.3263566099275003, "3": 0.002613623516435485, "2": 1.1429783748246575e-05, "1": 2.2504913225690384e-06}, "score": 4.668372844759037}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7592438615312944, "5": 0.23075431635737964, "3": 0.00995363965724715, "2": 4.23511492618776e-05, "1": 5.249010370428639e-06}, "score": 4.220700355883089}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7951932993865782, "5": 0.19711905355759402, "3": 0.007656896760225263, "2": 2.9321075505056708e-05, "1": 1.091222424234599e-06}, "score": 4.1894003049959485}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.49960271320043226, "4": 0.49647743235212016, "3": 0.003909264617653856, "2": 1.0025918179380688e-05, "1": 5.925141988028753e-07}, "score": 4.495671605026335}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8525026852295856, "4": 0.14632135710959226, "3": 0.001174220213245183, "2": 1.3770775799111866e-06, "1": 2.0099033793858925e-07}, "score": 4.851325243574094}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8233275848633055, "5": 0.16354588268020803, "3": 0.013108054374004894, "2": 1.7767208832955256e-05, "1": 5.919557212769435e-07}, "score": 4.150400535906693}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7534788351721464, "4": 0.24572329333017442, "3": 0.0007970721151641364, "2": 7.151468004585976e-07, "1": 5.867330403591789e-08}, "score": 4.752680175983788}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8947883492126927, "5": 0.09561826697818816, "3": 0.009589476305231909, "2": 3.7682607593329263e-06, "1": 7.916694391988821e-08}, "score": 4.086021021818421}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6913687988554111, "4": 0.3079303678429882, "3": 0.0006993984146962945, "2": 1.2978597452858458e-06, "1": 6.311230995348852e-08}, "score": 4.690666666434818}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6355525823983558, "4": 0.36386200149511155, "3": 0.0005849193988315797, "2": 4.1530609926920747e-07, "1": 2.8076778223549944e-08}, "score": 4.634966782016483}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7736651513459021, "5": 0.22079798290830013, "3": 0.005531165644700183, "2": 5.540244082292904e-06, "1": 7.385308906011635e-08}, "score": 4.215255533728989}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9416068577317361, "4": 0.05828506461538955, "3": 0.00010785573616871255, "2": 2.1649811418580025e-07, "1": 2.740813417248266e-08}, "score": 4.941498466071817}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5687716178686117, "4": 0.42978197231983806, "3": 0.0014456192536210664, "2": 7.758016151711557e-07, "1": 3.182804555962241e-08}, "score": 4.567324341842416}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9620064072457433, "4": 0.037969031957258335, "3": 2.446803466100078e-05, "2": 4.820023212644997e-08, "1": 8.451980874773515e-09}, "score": 4.96198185219196}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8982860142488828, "4": 0.10159125707011285, "3": 0.0001225526284793808, "2": 1.3462899861976183e-07, "1": 1.3067351101148016e-08}, "score": 4.898163178628826}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "human", "scores": {"5": 0.524806476781631, "4": 0.4745556103557584, "3": 0.0006375841433964941, "2": 2.728938350490807e-07, "1": 1.663681210725513e-08}, "score": 4.524168317481532}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.978435843958177, "4": 0.021546734612838462, "3": 1.739690919488816e-05, "2": 2.425565623394736e-08, "1": 8.72211572012802e-09}, "score": 4.9784183640958775}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7732498201551837, "4": 0.22639412106899437, "3": 0.0003559412033079022, "2": 1.0263713809173014e-07, "1": 1.080987249999405e-08}, "score": 4.7728936444365555}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9974468648078358, "4": 0.002551369513146566, "3": 1.7679126519057068e-06, "2": 5.959561097141669e-09, "1": 5.632012492300505e-09}, "score": 4.9974450542901385}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9841945185628295, "4": 0.015790250284766917, "3": 1.5165476443615993e-05, "2": 5.566484713107982e-08, "1": 1.2306453959830464e-08}, "score": 4.984179202578304}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6575533812584655, "4": 0.32200934890266336, "2": 0.01937039324527155, "5": 0.0010168510833720803, "1": 4.9883563412442165e-05}, "score": 3.304572933930469}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9791879277370329, "4": 0.020788623271748925, "3": 2.343980294673632e-05, "2": 4.808055516947683e-08, "1": 1.2433790875546899e-08}, "score": 4.979164304214944}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7123950328557841, "4": 0.28738704008612853, "3": 0.0002176793390133506, "2": 1.241521509164184e-07, "1": 0}, "score": 4.712177193214012}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7497191719282343, "5": 0.2488766467112195, "3": 0.00140281548657419, "2": 1.323794928878205e-06, "1": 4.1358246652189764e-08}, "score": 4.247471059738424}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9830478790017599, "4": 0.01693289668021106, "3": 1.9215102492073918e-05, "2": 2.7371815071455543e-08, "1": 0}, "score": 4.983028591307498}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8480681761657314, "5": 0.13971183486815003, "3": 0.012190637986304905, "2": 2.844315567921425e-05, "1": 7.191995352451991e-07}, "score": 4.127462177014382}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5878953224357205, "4": 0.4111457353955626, "3": 0.0009584332863880253, "2": 4.868153226766696e-07, "1": 2.6391654346770816e-08}, "score": 4.586935833805432}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8975397947934002, "4": 0.10220254493560672, "3": 0.00025677123645391454, "2": 7.114647242893455e-07, "1": 1.6626848094661494e-07}, "score": 4.897281111962528}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9477511833478292, "4": 0.052142376098798945, "3": 0.0001060793668662441, "2": 2.3141111260085697e-07, "1": 3.121403511034003e-08}, "score": 4.947644640917776}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6922930710103895, "4": 0.30637519520194867, "3": 0.001325819791898256, "2": 5.141765782712442e-06, "1": 5.389074433419548e-07}, "score": 4.690955512180089}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5397960478138342, "4": 0.45552069487461166, "3": 0.004675820142860039, "2": 7.171125085301707e-06, "1": 2.1846675172663769e-07}, "score": 4.535105255479174}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9975274032157255, "4": 0.0024676623339148977, "3": 4.890108825605866e-06, "2": 2.9304346125358004e-08, "1": 1.415964244583501e-08}, "score": 4.997522412894651}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.524095452495231, "5": 0.4718760187692436, "3": 0.0040251785856109555, "2": 3.1670310063731955e-06, "1": 9.24276186336298e-08}, "score": 4.467844271268165}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9957073055654204, "4": 0.004287227608729291, "3": 5.474607359462676e-06, "2": 2.9228166103705693e-08, "1": 1.557069834729554e-08}, "score": 4.995701673435268}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6788223638566518, "5": 0.31857052497138544, "3": 0.002601225236884907, "2": 5.467276298508802e-06, "1": 2.6013528872797787e-07}, "score": 4.3159576348627455}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5472154929144233, "5": 0.4468611495625905, "3": 0.005909372672400775, "2": 1.3247178123832242e-05, "1": 6.993538497372958e-07}, "score": 4.440923201367958}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7763204445725895, "5": 0.21569239144331603, "3": 0.007970808885899383, "2": 1.5933145434791832e-05, "1": 3.9783081896922254e-07}, "score": 4.20768852778394}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.5813393578272915, "4": 0.40859914055109814, "5": 0.007768661457771006, "2": 0.0022863079760551764, "1": 6.497961796533744e-06}, "score": 3.4218371740047857}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5092099510358252, "4": 0.4867745984012753, "3": 0.004007372457253, "2": 7.640114255418189e-06, "1": 3.6051509813597177e-07}, "score": 4.505186255944726}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5965031837939418, "3": 0.3803389500569076, "5": 0.019424506275774266, "2": 0.00372555554005806, "1": 7.784379191854893e-06}, "score": 3.631611084650296}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8922587678375177, "3": 0.09788126661529759, "5": 0.009815606107268936, "2": 4.3888817367586236e-05, "1": 3.514367798680447e-07}, "score": 3.911845497040134}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9629614318365515, "4": 0.036976977120353714, "3": 6.13626631373385e-05, "2": 1.3356047038191328e-07, "1": 2.3479878890155696e-08}, "score": 4.96289980030573}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8740436952596764, "5": 0.1195042312843727, "3": 0.006449915171283066, "2": 2.1435011808724367e-06, "1": 4.564585653323726e-08}, "score": 4.113049888684171}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7359842941139804, "4": 0.26393020124930155, "3": 8.543224092669834e-05, "2": 4.5668913512183736e-08, "1": 0}, "score": 4.735898790203504}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6352801730472345, "4": 0.3644727100075804, "3": 0.00024696251351496155, "2": 1.4536485697425318e-07, "1": 0}, "score": 4.635032925561731}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8847134249756357, "3": 0.07006936493041854, "5": 0.04509897319624397, "2": 0.00011714079155310531, "1": 1.116662759228376e-06}, "score": 3.9747919772126337}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7261378544646263, "5": 0.2535068334256533, "3": 0.02030428157802963, "2": 4.92388801300834e-05, "1": 1.4940066800678845e-06}, "score": 4.233099661448245}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9055459423043715, "5": 0.0857915982308782, "3": 0.008659759743824288, "2": 2.596326491211022e-06, "1": 6.899857394682803e-08}, "score": 4.077126441491179}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9383490196545222, "5": 0.04974187725321024, "3": 0.011898404065516037, "2": 1.0508248896917115e-05, "1": 6.630483608209881e-08}, "score": 4.037822262483243}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5838253086067344, "5": 0.4135860973955466, "3": 0.0025860553374556406, "2": 2.3889610348213876e-06, "1": 5.943764839427286e-08}, "score": 4.410995122920147}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "human", "scores": {"4": 0.914447382236585, "3": 0.043476444208786595, "5": 0.04202668522315365, "2": 4.9324433064450434e-05, "1": 2.2082506720041781e-07}, "score": 3.9984509297612196}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6621440424044592, "4": 0.33272917772449434, "3": 0.005100610706746527, "2": 2.4546948716053493e-05, "1": 1.3375807314971135e-06}, "score": 4.656990512060483}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5898248208403061, "4": 0.4077018628495359, "3": 0.0024719425004326445, "2": 1.247365288901523e-06, "1": 3.8686853401934025e-08}, "score": 4.58735031909318}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8758666724753521, "4": 0.1239582702819868, "3": 0.00017467560324565368, "2": 3.169391618316468e-07, "1": 1.7084144940710347e-08}, "score": 4.875691353438363}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9999989719621284, "5": 4.965781321404978e-07, "3": 4.7682990640377827e-07, "2": 3.3606343269926315e-08, "1": 1.1588066712763533e-08}, "score": 3.999999917771338}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7675855038946604, "3": 0.22920449102124255, "5": 0.002715127134470337, "2": 0.0004926887115910718, "1": 2.099534299438302e-06}, "score": 3.7725189396812464}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7581040148474912, "5": 0.23980528438423995, "3": 0.002089810263794242, "2": 8.095542899897763e-07, "1": 2.5915230263695364e-08}, "score": 4.237713790348743}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7274703767569304, "5": 0.2707336994728128, "3": 0.0017950584408415265, "2": 8.594080488390718e-07, "1": 3.029924627963664e-08}, "score": 4.268936824762025}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5940214198001709, "5": 0.4048742070493008, "3": 0.0011036235241702087, "2": 6.276287548352483e-07, "1": 0}, "score": 4.403769377526517}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8296521686028511, "4": 0.17011015179953715, "3": 0.00023721847642697773, "2": 4.2378821475722346e-07, "1": 0}, "score": 4.829414133514489}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9541486233430818, "3": 0.03590970448863819, "5": 0.00991639927388625, "2": 2.500754446555208e-05, "1": 1.5246176403129813e-07}, "score": 3.973956219370991}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5739672729813281, "4": 0.41926078252704824, "3": 0.006757229569002269, "2": 1.3932727345461498e-05, "1": 5.581974969498387e-07}, "score": 4.567180630412346}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.806445064233803, "4": 0.19298760788276223, "3": 0.0005665282563062756, "2": 6.172343891555228e-07, "1": 6.063376019898644e-08}, "score": 4.805877217730225}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6868803602726978, "4": 0.3117261191257716, "3": 0.0013890993381786457, "2": 4.257220821077496e-06, "1": 1.772955008685714e-07}, "score": 4.685482205521699}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5549226468468657, "5": 0.4425191228445521, "3": 0.0025482141461600485, "2": 9.634087185746171e-06, "1": 3.1161574334885994e-07}, "score": 4.439950736675496}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8156032137001976, "5": 0.14956434162129528, "3": 0.03456780919735197, "2": 0.00025923048202381994, "1": 5.462980707726502e-06}, "score": 4.114461675881104}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.926311192293149, "4": 0.07333384089693476, "3": 0.0003494528193883485, "2": 4.332975801157343e-06, "1": 7.812817474386326e-07}, "score": 4.925951099810107}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7812791239268411, "3": 0.21472086429243012, "5": 0.003761470528627531, "2": 0.0002381678216021433, "1": 3.7706019266563367e-07}, "score": 3.7885631401798667}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8357008791357581, "4": 0.1641727256838981, "3": 0.00012569188536760032, "2": 5.775291035862172e-07, "1": 8.496869010671057e-08}, "score": 4.835573811375171}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.753088747169606, "5": 0.2457024323081336, "3": 0.0012052544168619063, "2": 3.4858173762642185e-06, "1": 1.1535725024372384e-07}, "score": 4.244489851610697}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8917790935892745, "5": 0.08627142915148271, "3": 0.021945872459293934, "2": 3.5064234503269434e-06, "1": 3.8469773804074537e-08}, "score": 4.064318432289073}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5877062092969496, "5": 0.40813709657632113, "3": 0.00414874831946655, "2": 7.571646582249439e-06, "1": 2.6081565026748985e-07}, "score": 4.40397246830501}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8978387522493979, "5": 0.08392655565795641, "3": 0.018205236618380742, "2": 2.914614211195129e-05, "1": 2.4508836940162437e-07}, "score": 4.065662295708639}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9354219107765691, "4": 0.06454840961664854, "3": 2.9561787307330533e-05, "2": 3.6965492300832246e-08, "1": 0}, "score": 4.935392350688475}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9864717357193629, "4": 0.01351618665900723, "3": 1.2038027023398551e-05, "2": 2.129729005052589e-08, "1": 0}, "score": 4.9864596731473245}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9513084778043162, "3": 0.03200034163966083, "5": 0.01667824172129832, "2": 1.2822065551350211e-05, "1": 8.34715484733247e-08}, "score": 3.9846520050248384}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7636667851852615, "4": 0.23588534931187397, "3": 0.0004469622137149506, "2": 7.594176100437098e-07, "1": 7.869493829864664e-08}, "score": 4.763218117795473}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9625656243515104, "4": 0.03738085888843473, "3": 5.338338514600557e-05, "2": 5.9202207908513755e-08, "1": 7.777258023625974e-09}, "score": 4.962512163136596}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6329217640336352, "4": 0.3669167851860467, "3": 0.000161302834522886, "2": 1.588584949264124e-07, "1": 8.929146708348025e-09}, "score": 4.632760104139552}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.529429959164403, "4": 0.4696577082134239, "3": 0.0009113650750323575, "2": 7.961469958482701e-07, "1": 7.183938310915384e-08}, "score": 4.528516838896768}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7273155366188249, "5": 0.2610369789224856, "3": 0.011605025986591916, "2": 4.066710594627034e-05, "1": 1.8603089162950374e-06}, "score": 4.249345020606717}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9874344718785147, "4": 0.012530775757242577, "3": 3.421255075761631e-05, "2": 3.4314525344194345e-07, "1": 1.2673963157382434e-07}, "score": 4.987399261865803}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7909323100771082, "4": 0.2082342148182845, "3": 0.00083142205828718, "2": 1.9310590016754387e-06, "1": 1.0884902571694844e-07}, "score": 4.790096709734263}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7894706905826998, "4": 0.20975783087608046, "3": 0.0007668033331279517, "2": 4.239564526538928e-06, "1": 3.776567963211571e-07}, "score": 4.788694320883965}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7631658543167039, "4": 0.23625997293919773, "3": 0.0005711306302241706, "2": 2.718943968278947e-06, "1": 1.9894528495549074e-07}, "score": 4.762588783694992}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "human", "scores": {"4": 0.800487037244523, "5": 0.1919912463347909, "3": 0.007516615566297085, "2": 5.010053321049919e-06, "1": 7.133812071625064e-08}, "score": 4.184464400237709}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.753596326751532, "5": 0.23819214478444037, "3": 0.00820082352398821, "2": 1.0340792993466969e-05, "1": 1.360307328365389e-07}, "score": 4.22997028404224}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7816827353736059, "5": 0.20575976089320885, "3": 0.012545871897306975, "2": 1.1206994115142906e-05, "1": 2.3759910887287301e-07}, "score": 4.193190798383904}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7555999571988748, "4": 0.24317009526482533, "3": 0.0012280165157988873, "2": 1.7700902924429617e-06, "1": 1.3981048639238113e-07}, "score": 4.754367997003074}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5253371878402399, "4": 0.47061021339621323, "3": 0.004042403654276982, "2": 9.890053528085136e-06, "1": 1.565716663243468e-07}, "score": 4.521274611764887}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.800690042479488, "5": 0.13605468207164292, "3": 0.06303784617638024, "2": 0.00021369538319796296, "1": 3.772743886066459e-06}, "score": 4.072578124077216}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7743034251928941, "5": 0.22015808995233832, "3": 0.005533415627270826, "2": 4.820711628654047e-06, "1": 1.567954103790919e-07}, "score": 4.214614582200127}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7901810283197762, "4": 0.20923660207036848, "3": 0.0005817847639647681, "2": 5.181541769878168e-07, "1": 7.725632866949344e-08}, "score": 4.789597967136672}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9527058784337963, "4": 0.047156755659840725, "3": 0.00013689210461188808, "2": 4.090113216462719e-07, "1": 6.138581834814071e-08}, "score": 4.952567987392209}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8070381402959976, "4": 0.19257447826556068, "3": 0.0003864162506355652, "2": 7.601234368092106e-07, "1": 8.165065463394358e-08}, "score": 4.806650058398205}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5521325691696427, "5": 0.4461100538011463, "3": 0.0017509536440765406, "2": 6.14741432200471e-06, "1": 1.9821669212586814e-07}, "score": 4.4443462452281}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.758365689274689, "4": 0.24133274816454947, "3": 0.00030056305271282234, "2": 8.313532850527802e-07, "1": 5.163170061977956e-08}, "score": 4.758063396952174}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7031055754483297, "5": 0.29566512486974394, "3": 0.001226833769023177, "2": 2.3391124392797395e-06, "1": 6.209812758946182e-08}, "score": 4.294433445631991}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7176170921708183, "4": 0.2814004880329633, "3": 0.0009785085825865275, "2": 3.5662212362366947e-06, "1": 3.4552114308362195e-07}, "score": 4.716630414203415}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7496214898842555, "4": 0.24986680077664777, "3": 0.0005101037609992189, "2": 1.5453115769778238e-06, "1": 1.1643787127141167e-07}, "score": 4.749107904108086}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9539260884066089, "4": 0.045846918079406634, "3": 0.0002264201984151733, "2": 4.862806065173966e-07, "1": 3.6395379761102654e-08}, "score": 4.953698634755744}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7999773773712384, "4": 0.19955062808209795, "3": 0.00046095441625388766, "2": 1.0881853201727845e-05, "1": 1.541464056668922e-07}, "score": 4.799494200111916}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.716343685146672, "4": 0.2834046624573755, "3": 0.00025147235372838375, "2": 1.6610129896142068e-07, "1": 2.012582541646747e-08}, "score": 4.716091815783914}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5189502281153371, "5": 0.4777201873531792, "3": 0.003327517661402007, "2": 2.0589230564401464e-06, "1": 4.291132756766914e-08}, "score": 4.474388406525023}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9149470538734662, "3": 0.08154265674621282, "5": 0.0033466999774998114, "2": 0.00016302728149948778, "1": 5.715665000148347e-07}, "score": 3.9214762747104586}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6446941053192368, "3": 0.31384661490076193, "5": 0.039217453065852725, "2": 0.002231020890137118, "1": 1.0680189298613767e-05}, "score": 3.7208767207493474}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7940125593809213, "3": 0.18913052383063933, "5": 0.00858128508406606, "2": 0.008156660877031376, "1": 0.00011869813124329562}, "score": 3.802781291324862}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5092759845713679, "5": 0.4864404450292445, "3": 0.004267917395975324, "2": 1.5137340286367722e-05, "1": 3.8587127791558404e-07}, "score": 4.482141157916854}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5987658013748862, "4": 0.4000441951910008, "3": 0.001185090068630888, "2": 4.559033083565644e-06, "1": 2.392157434349585e-07}, "score": 4.597570944383226}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5873578968048204, "5": 0.41140341535959024, "3": 0.0012377562676386927, "2": 8.62634291388784e-07, "1": 3.5251526629063846e-08}, "score": 4.410163841883982}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9004667580852737, "3": 0.08214649510385096, "5": 0.01729239620189929, "2": 9.367478579217269e-05, "1": 7.082384543696025e-07}, "score": 3.9349564289195054}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9099146273237471, "4": 0.09004530917996315, "3": 3.9892668413000015e-05, "2": 1.599331374485343e-07, "1": 0}, "score": 4.909874424701904}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9881961436266803, "4": 0.011757781526656113, "3": 4.585450999394978e-05, "2": 1.115633774394396e-07, "1": 2.4692408221759705e-08}, "score": 4.988150074997239}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9673969581056966, "4": 0.03258494197261177, "3": 1.7956489075033072e-05, "2": 5.053286097047022e-08, "1": 1.1261263603180404e-08}, "score": 4.9673789457424675}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9558484132971128, "4": 0.044071917092348166, "3": 7.933064976695425e-05, "2": 2.9009482054834476e-07, "1": 2.749358863502257e-08}, "score": 4.95576844040397}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6001360496818597, "5": 0.39610094048284133, "3": 0.003751333133159038, "2": 1.0695633327774042e-05, "1": 5.961705816556144e-07}, "score": 4.392326578577088}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6590762141188622, "5": 0.3390608802389892, "3": 0.0018612332003701381, "2": 1.6272778009802043e-06, "1": 0}, "score": 4.337196407712149}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6005860382740857, "5": 0.39213861186405585, "3": 0.007249514339605114, "2": 2.4203967305360504e-05, "1": 1.359193566362573e-06}, "score": 4.384836716823802}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9764554439713051, "4": 0.023508787301550964, "3": 3.533625737670218e-05, "2": 2.9048555107945917e-07, "1": 6.546265562685755e-08}, "score": 4.976419405071996}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9714169919458883, "4": 0.02854692655466947, "3": 3.5734784064493914e-05, "2": 1.7547469367881112e-07, "1": 3.8979576791252995e-08}, "score": 4.971380917749622}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6253953932945475, "4": 0.3736344372806781, "3": 0.0009666493931235582, "2": 3.2990863218324527e-06, "1": 1.3421390550564395e-07}, "score": 4.624421797244055}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7426593786196418, "4": 0.2560167005773801, "3": 0.0013208365409107731, "2": 2.868971370291567e-06, "1": 1.805485717148522e-07}, "score": 4.741332288245735}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8760832748059806, "4": 0.12377909426432049, "3": 0.0001374888135729918, "2": 9.121185128575131e-08, "1": 0}, "score": 4.8759456481580825}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9591324816686919, "4": 0.040776208200520234, "3": 9.073385563355928e-05, "2": 3.995683490062874e-07, "1": 6.472553795169824e-08}, "score": 4.959040861894358}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6771800626608135, "4": 0.3214931956223914, "3": 0.0013249141686758616, "2": 1.7916349053899517e-06, "1": 7.033867831682362e-08}, "score": 4.675851330939796}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6340914005692191, "3": 0.35721054826452636, "5": 0.008319511831241846, "2": 0.0003773861213814502, "1": 1.1137208849078137e-06}, "score": 3.6503508363526915}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9536095538525733, "4": 0.04628323863298332, "3": 0.00010680530076913886, "2": 2.764847973375375e-07, "1": 3.59925451176362e-08}, "score": 4.953502173168362}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8462748079755888, "4": 0.15305587931298104, "3": 0.0006675208047572043, "2": 1.615133406592494e-06, "1": 1.6778104687131775e-07}, "score": 4.845603561164732}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.685026503655859, "4": 0.3086802276184733, "3": 0.0062818949524305265, "2": 1.0768676090770536e-05, "1": 4.865758684484824e-07}, "score": 4.678721692066604}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6655815028836755, "5": 0.3316809719215593, "3": 0.0027342174728690123, "2": 3.1947363279611654e-06, "1": 6.578328883129608e-08}, "score": 4.328940183152894}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8839471033272075, "4": 0.1156930402506707, "3": 0.00035813197293900164, "2": 1.5055082637492487e-06, "1": 1.9537579091960807e-07}, "score": 4.8835853950321715}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7556261769723002, "4": 0.24393389805554358, "3": 0.00043877272046033086, "2": 9.636728183470767e-07, "1": 1.3748390242034246e-07}, "score": 4.755185103040661}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6353851681241366, "4": 0.3635039919820326, "3": 0.0011095242046629274, "2": 1.0185464459622122e-06, "1": 0}, "score": 4.634273795296424}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9897762851357147, "4": 0.010215623652065724, "3": 7.980751324457127e-06, "2": 4.526340353246423e-08, "1": 0}, "score": 4.989768278387992}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8121226690270988, "5": 0.18340174582221166, "3": 0.004468109010589317, "2": 7.0846966609550486e-06, "1": 1.4084610451246422e-07}, "score": 4.178919089716634}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6920993806637395, "5": 0.3050168066873312, "3": 0.0028813020105450783, "2": 2.3483114969448113e-06, "1": 7.028727953151898e-08}, "score": 4.302130624999938}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5688464162542475, "4": 0.4297860294808065, "3": 0.0013662124538803694, "2": 1.3323663315126566e-06, "1": 7.183959862762641e-08}, "score": 4.56747728814124}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9235448419477642, "4": 0.07638189403245574, "3": 7.318185867655535e-05, "2": 6.437387202871876e-08, "1": 0}, "score": 4.923471547767346}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.562533343121449, "4": 0.4369014474629096, "3": 0.0005644552224604644, "2": 6.957130820774965e-07, "1": 1.9524612261183433e-08}, "score": 4.561967459790703}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5725645722257916, "4": 0.4258332249895887, "3": 0.001599864085351317, "2": 2.248035127371448e-06, "1": 1.125438402613315e-07}, "score": 4.570959861946234}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.882778825942423, "3": 0.09446853149426121, "5": 0.02264914898874018, "2": 0.0001030279239671679, "1": 3.24196507621266e-07}, "score": 3.9279735788685888}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7466174426474858, "5": 0.2412151271222777, "3": 0.012107647514887658, "2": 5.909637335421465e-05, "1": 6.454720031160085e-07}, "score": 4.228987359803384}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9700731363772089, "5": 0.015342400637704683, "3": 0.014574541576026343, "2": 9.827195152242527e-06, "1": 0}, "score": 4.000748204741866}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9770214795218612, "4": 0.02296341457878701, "3": 1.5001955480383345e-05, "2": 5.9532110362875395e-08, "1": 0}, "score": 4.9770064018927345}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5735715671787599, "4": 0.42566698660539104, "3": 0.0007598374721407299, "2": 1.443247175570261e-06, "1": 0}, "score": 4.572808938010162}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6703007075812697, "5": 0.19919012666395627, "3": 0.13020495410108762, "2": 0.0002994587138983347, "1": 4.5757863235748626e-06}, "score": 4.068372539888533}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9491993843685653, "4": 0.05059565378271596, "3": 0.00020448171493496465, "2": 3.9765342598553813e-07, "1": 5.709798556377647e-08}, "score": 4.948993960140539}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8312795489789717, "4": 0.16505460837305258, "3": 0.0036628919254587068, "2": 2.843653184038428e-06, "1": 7.525955233837855e-08}, "score": 4.827610770294606}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9937035472617585, "4": 0.006280487337500833, "3": 1.585602505847183e-05, "2": 6.41197761706191e-08, "1": 0}, "score": 4.99368760796738}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6712056943702742, "3": 0.31405419890224245, "5": 0.013805447753109351, "2": 0.0009303301823890387, "1": 4.294802445401539e-06}, "score": 3.697877693809754}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "human", "scores": {"4": 0.915697787551013, "5": 0.07654834323697374, "3": 0.007747072104239435, "2": 6.6486814576574224e-06, "1": 1.4945626929244242e-07}, "score": 4.068787525330164}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7555329988976341, "4": 0.24339632430530253, "3": 0.0010681548054766962, "2": 2.251119297246431e-06, "1": 1.6274032575338753e-07}, "score": 4.754459935213819}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7196671036019372, "4": 0.27639894611330434, "3": 0.003920594415767743, "2": 1.1960027620955676e-05, "1": 1.384673757809937e-06}, "score": 4.715718443102519}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.835306939049919, "4": 0.16408373535948936, "3": 0.0006035077353665797, "2": 4.807218093982447e-06, "1": 8.321617532977668e-07}, "score": 4.834691469364981}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8400203510481362, "4": 0.15971942449587506, "3": 0.00025969232319852643, "2": 4.955844816150327e-07, "1": 4.3304338961296465e-08}, "score": 4.839759531969517}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8146168573176902, "5": 0.18014172081836413, "3": 0.005238680632729813, "2": 2.557557132939159e-06, "1": 8.361741710321617e-08}, "score": 4.174897691718797}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6589609517689992, "5": 0.33878309979152255, "3": 0.0022518954391504346, "2": 3.842274688299122e-06, "1": 1.8527604293610322e-07}, "score": 4.336522972539241}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7590718819077705, "5": 0.2381356523079701, "3": 0.0027912632718947034, "2": 1.0777424809084623e-06, "1": 2.723428988688465e-08}, "score": 4.235342174802482}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7282190887321411, "5": 0.2711364172694291, "3": 0.0006440550848735113, "2": 4.1650682038475e-07, "1": 0}, "score": 4.270491535231748}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8834806013999441, "4": 0.11640538288937205, "3": 0.00011391374713705577, "2": 1.2286397350539157e-07, "1": 0}, "score": 4.883366423462125}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6067814088477126, "5": 0.3914254238291721, "3": 0.0017911485801859971, "2": 1.794615078440517e-06, "1": 0}, "score": 4.389630773345937}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7371455768820322, "5": 0.2585818501867878, "3": 0.004268342928552152, "2": 3.795019533358074e-06, "1": 0}, "score": 4.254306027837991}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7222989266090677, "4": 0.2755140647412179, "3": 0.002185266259421149, "2": 1.504227621207488e-06, "1": 0}, "score": 4.720110823397922}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9533777347579498, "4": 0.046607071520330105, "3": 1.5088797151377409e-05, "2": 3.941734062815276e-08, "1": 0}, "score": 4.95336262957826}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7404821284512704, "5": 0.2536514242409965, "3": 0.005833473840896715, "2": 3.2075181142873535e-05, "1": 6.54648753071427e-07}, "score": 4.247751896453069}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5217183479658297, "4": 0.4772640868984757, "3": 0.001017085596270204, "2": 4.4832877541089944e-07, "1": 3.0529085035705243e-08}, "score": 4.520700274479644}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9940393847754508, "4": 0.0059494904603953035, "3": 1.1101703421761829e-05, "2": 2.5696269788398495e-08, "1": 1.082933696365702e-08}, "score": 4.994028185807013}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6133717396580582, "4": 0.38445810333179126, "3": 0.0021697281408333768, "2": 4.7501640341631797e-07, "1": 3.12657371100513e-08}, "score": 4.611200920372418}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986549588797473, "4": 0.0013434324638299149, "3": 1.583512622077685e-06, "2": 1.0674031584782675e-08, "1": 0}, "score": 4.998653368469346}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9763714489810372, "4": 0.023599666462390475, "3": 2.885844173536125e-05, "2": 2.077902027259797e-08, "1": 0}, "score": 4.976342554190847}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "human", "scores": {"5": 0.776177738939963, "4": 0.22275900209550187, "3": 0.001058449687927373, "2": 4.3819181309429466e-06, "1": 4.193935909788909e-07}, "score": 4.775109273408659}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.4797165357714311, "4": 0.4656832020353768, "3": 0.052718491638475445, "2": 0.0018540543449450007, "1": 2.726709211243154e-05}, "score": 4.42320832423706}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5643332122935029, "4": 0.43382389461772447, "3": 0.0018403435736175503, "2": 2.3727332435463593e-06, "1": 9.567392898508925e-08}, "score": 4.562487881853867}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9966116666015808, "4": 0.0033821218506014765, "3": 6.049112444935224e-06, "2": 9.844606521537629e-08, "1": 4.7297613370728596e-08}, "score": 4.996605295339196}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989771220966152, "4": 0.0010218858358959524, "3": 9.385553552257124e-07, "2": 6.5775598753477725e-09, "1": 0}, "score": 4.998976217272664}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9937825478465113, "4": 0.006204221695636281, "3": 1.3127110006598145e-05, "2": 4.8153548723281206e-08, "1": 1.715376763997706e-08}, "score": 4.993769310771615}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7958024916451926, "5": 0.20241905515045733, "3": 0.0017764869294550041, "2": 1.922281108089049e-06, "1": 1.1381118882593282e-07}, "score": 4.20063836821717}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9494666937666077, "4": 0.050286310297625286, "3": 0.00024616192668967205, "2": 6.619909180905223e-07, "1": 7.16707587700481e-08}, "score": 4.949219088097474}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9898442608510909, "4": 0.010135042557746641, "3": 2.0498865803685e-05, "2": 1.0832281936608517e-07, "1": 2.23755945739751e-08}, "score": 4.989823544557713}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9924669636199728, "4": 0.007520158982153838, "3": 1.2780423140215083e-05, "2": 7.687769919165195e-08, "1": 0}, "score": 4.992454049386816}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9044757499083533, "5": 0.08279187917478999, "3": 0.012715154871017077, "2": 1.681999837551561e-05, "1": 2.7824967911971317e-07}, "score": 4.070042257808808}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6985626305168497, "4": 0.3008368162343274, "3": 0.0005998671763528142, "2": 5.780398650370868e-07, "1": 2.4939822844190586e-08}, "score": 4.6979615904368695}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7728822813695928, "4": 0.2267427191714219, "3": 0.00037369171197630717, "2": 1.1440934285825002e-06, "1": 7.814865427475467e-08}, "score": 4.772506133077877}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8903165992662972, "5": 0.10347507671094454, "3": 0.006194657821817268, "2": 1.3541019471478928e-05, "1": 1.954375394252887e-07}, "score": 4.097252743704971}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8530455270962743, "5": 0.14506911426785646, "3": 0.0018832749932633595, "2": 1.900814651001048e-06, "1": 2.4558519903473453e-08}, "score": 4.143181986631064}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7137369513502838, "5": 0.27571438114963676, "3": 0.010517360565163806, "2": 3.0145165376614126e-05, "1": 1.1247609879896374e-06}, "score": 4.265133365782956}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7127845059104426, "4": 0.28527170556672676, "3": 0.0019405231059724474, "2": 3.089371147197079e-06, "1": 2.0671268562172703e-07}, "score": 4.710837162124893}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9875728013877081, "4": 0.012364312253205383, "3": 6.262499990977277e-05, "2": 1.4465590263951454e-07, "1": 0}, "score": 4.9875100023216445}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7025631771020464, "4": 0.2965345029087515, "3": 0.0008993092403943661, "2": 2.820983429337862e-06, "1": 1.6938798229730515e-07}, "score": 4.701657732028803}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7127917692215643, "5": 0.28277504257593405, "3": 0.0044270271164857, "2": 5.990695753966814e-06, "1": 1.6629342308937083e-07}, "score": 4.278335536327967}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6950449425281078, "4": 0.2521245166031577, "2": 0.04915798420034626, "5": 0.0035385083878417276, "1": 0.00013394276180194194}, "score": 3.2097756857901585}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7184530284936407, "5": 0.2712896526300993, "3": 0.009861690251083606, "2": 0.00036668132916999686, "1": 2.866860317626638e-05}, "score": 4.2606086665409135}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9437387018879676, "4": 0.05619497156600628, "3": 6.609906212080219e-05, "2": 9.76476739679602e-08, "1": 1.0483743684904663e-08}, "score": 4.943672488708927}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9118025997304156, "4": 0.08784787092386225, "3": 0.00034856424414645603, "2": 9.052166768225174e-07, "1": 7.249675751622977e-08}, "score": 4.91145199606754}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8781101918288202, "4": 0.12165980657165179, "3": 0.00022960158275738617, "2": 3.4822012988885564e-07, "1": 2.389052261400793e-08}, "score": 4.877879846632454}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5251992839183842, "4": 0.47417401708923324, "3": 0.0006256950162942925, "2": 9.410985253743143e-07, "1": 3.250795527082545e-08}, "score": 4.524571625112207}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9752058354339205, "4": 0.024760028007679603, "3": 3.378343379614231e-05, "2": 2.1646715716895125e-07, "1": 9.3555592981556e-08}, "score": 4.975171380430726}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9946084215142641, "4": 0.005386308543653759, "3": 5.272589235674269e-06, "2": 1.2362798434322195e-08, "1": 0}, "score": 4.9946031092704875}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9596287529414873, "4": 0.040323857002899324, "3": 4.676970002877437e-05, "2": 3.017880159448429e-07, "1": 7.963413534718892e-08}, "score": 4.959581370039092}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9709963419496691, "4": 0.02895292626806642, "3": 5.036339179918563e-05, "2": 2.087158665746652e-07, "1": 4.262026468278252e-08}, "score": 4.970945546918726}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.876289730630661, "5": 0.11013225689577097, "3": 0.013554455046161816, "2": 2.2763754542196758e-05, "1": 6.479119690850497e-07}, "score": 4.096530344674967}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8936062920627297, "5": 0.09753318499151002, "3": 0.008833511191270169, "2": 2.6290497391064223e-05, "1": 6.345511109014627e-07}, "score": 4.088645196838194}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7649364121369372, "4": 0.23460162877779803, "3": 0.00046164147328581884, "2": 3.036882971140105e-07, "1": 3.1797696083160597e-08}, "score": 4.764474054229749}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9866757182225642, "4": 0.013310628866770584, "3": 1.3448593901779656e-05, "2": 6.741683990587406e-08, "1": 1.9790001530399115e-08}, "score": 4.986662190972909}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9943823980682244, "4": 0.005616000068844452, "3": 1.580794482943026e-06, "2": 4.50913724480984e-09, "1": 0}, "score": 4.994380824721728}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5450869258852703, "4": 0.45114111267689316, "3": 0.003760566379795496, "2": 1.0767933077754519e-05, "1": 4.1091806399539394e-07}, "score": 4.541303707918724}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9648993968950389, "3": 0.02438604589069253, "5": 0.01067057847552313, "2": 4.335693025678273e-05, "1": 4.003466660703386e-07}, "score": 3.9861966146273966}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9953378636541825, "4": 0.004657599930009851, "3": 4.5328440040474465e-06, "2": 3.659822847620497e-08, "1": 1.5523575012096065e-08}, "score": 4.995333162719571}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9865718657090058, "4": 0.013410155311342837, "3": 1.7706725832958383e-05, "2": 1.1085431224687588e-07, "1": 4.235234692620536e-08}, "score": 4.986553927663949}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8473486667320534, "4": 0.152266759444061, "3": 0.00038372189481961273, "2": 7.789090890531044e-07, "1": 4.5169172822006976e-08}, "score": 4.846963275100145}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9140359003656143, "5": 0.06826211851634854, "3": 0.01769935642912205, "2": 2.4059661728685574e-06, "1": 0}, "score": 4.050557961213057}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7019645603939334, "5": 0.2611000530756442, "3": 0.036903392296746725, "2": 2.9802687021832e-05, "1": 0}, "score": 4.224137546612744}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9219821552550401, "4": 0.07796421808867032, "3": 5.354945170813316e-05, "2": 7.903010350799236e-08, "1": 0}, "score": 4.921928446060125}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5680757877639391, "4": 0.4305459863627039, "3": 0.0013752221462555961, "2": 2.65962878345896e-06, "1": 0}, "score": 4.566695441359065}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7838024244669255, "4": 0.21591043717378305, "3": 0.0002863920161034818, "2": 2.746879804472383e-07, "1": 0}, "score": 4.783515852624193}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6828669504987619, "3": 0.30005499633816013, "5": 0.015896718097873207, "2": 0.0011767173782156744, "1": 4.1439049087524234e-06}, "score": 3.7134757195384855}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.825246920378097, "3": 0.17270060338540943, "2": 0.001132164830294986, "5": 0.000914526877671919, "1": 4.950569190571723e-06}, "score": 3.825934596960633}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5952845812288915, "5": 0.4029395412508041, "3": 0.0017726114929729332, "2": 2.9372699395855714e-06, "1": 8.66004348524285e-08}, "score": 4.401160892560548}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.988664215223615, "4": 0.011306704620118496, "3": 2.884467954119773e-05, "2": 1.1093704041758304e-07, "1": 1.279524780744662e-08}, "score": 4.988635220758736}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8201930988860638, "5": 0.17791794822414272, "3": 0.0018789033440030538, "2": 9.684653874990066e-06, "1": 1.9827656260687766e-07}, "score": 4.176019110070188}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7465208963226224, "4": 0.2527484635580333, "3": 0.0007286077766733176, "2": 1.7433421695375727e-06, "1": 1.9173569535063566e-07}, "score": 4.745788299193479}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5249092229539929, "5": 0.47056148893722693, "3": 0.004523977926228515, "2": 5.058214512894743e-06, "1": 1.1543445006459771e-07}, "score": 4.4660271119069765}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7579688721107057, "3": 0.23614352547919612, "5": 0.005764556834164674, "2": 0.000122556917896442, "1": 3.515518942624044e-07}, "score": 3.7693748312433657}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9907672678446399, "4": 0.009224800641191588, "3": 7.802350683437276e-06, "2": 3.553388815096612e-08, "1": 0}, "score": 4.990759487190592}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7258467605928994, "5": 0.26463147003520526, "3": 0.009495261445745744, "2": 2.5910740088011187e-05, "1": 2.815507841870425e-07}, "score": 4.2550836229703215}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8256818245273073, "4": 0.17362779154915317, "3": 0.0006894082065847571, "2": 9.365087235964442e-07, "1": 5.3915221300630467e-08}, "score": 4.824990369424486}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996244513760448, "4": 0.000374892889797406, "3": 6.140613470672554e-07, "1": 9.580433456557466e-09, "2": 0}, "score": 4.999623840653702}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.953018573510514, "4": 0.04683058799118188, "3": 0.00015044883475244525, "2": 2.5605156166340427e-07, "1": 3.690237222595697e-08}, "score": 4.952867594016983}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9968410624756584, "4": 0.0031518994748244945, "3": 6.922393269034507e-06, "2": 3.791666923678964e-08, "1": 2.3132899774816953e-08}, "score": 4.996834049284148}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.996064248153261, "4": 0.003930176276640049, "3": 5.550414213099132e-06, "2": 2.548377147815189e-08, "1": 1.132526235320183e-08}, "score": 4.996058601188499}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8895399998252688, "5": 0.10534588497577935, "3": 0.005105106324808148, "2": 8.753586988981202e-06, "1": 1.4205450712569696e-07}, "score": 4.100222856661971}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7985588926063426, "5": 0.19279290447470718, "3": 0.008643618292305432, "2": 4.579388884833423e-06, "1": 4.825202698461406e-08}, "score": 4.184139974727905}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9871782471208418, "4": 0.012816170308548598, "3": 5.543608031306098e-06, "2": 3.1959961937017204e-09, "1": 0}, "score": 4.987172732428612}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8543689096128719, "4": 0.14555045248516132, "3": 8.047387181113054e-05, "2": 1.0893624871469509e-07, "1": 1.2142028172364516e-08}, "score": 4.854288218135763}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9834097376792379, "4": 0.016586076510616995, "3": 4.174967433713588e-06, "2": 6.763603681186836e-09, "1": 0}, "score": 4.9834055531960155}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "human", "scores": {"5": 0.577715913655983, "4": 0.42024958256311373, "3": 0.002029186307556009, "2": 4.7921710638014255e-06, "1": 2.2220510171299053e-07}, "score": 4.575676650876964}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7263952070070997, "4": 0.27306926446189383, "3": 0.000534316605768037, "2": 1.2023819623408896e-06, "1": 5.787577116289089e-08}, "score": 4.725858276927551}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9586872387325832, "4": 0.04128060920684376, "3": 3.202214062122037e-05, "2": 2.4035594527510673e-08, "1": 0}, "score": 4.9586552700273705}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8331101272262141, "4": 0.16656101170774668, "3": 0.00032752636575738246, "2": 1.1329598652264246e-06, "1": 2.005324014528654e-07}, "score": 4.832779734349533}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5629578052055494, "5": 0.43681098764626386, "3": 0.00023117512911140583, "2": 8.316901286660195e-08, "1": 0}, "score": 4.436579623848106}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8703665797887754, "5": 0.12356886092043641, "3": 0.006049016391949378, "2": 1.5101008927270195e-05, "1": 1.6156149383124993e-07}, "score": 4.11748919076171}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9290723906566588, "5": 0.05990353263842357, "3": 0.011016005701395985, "2": 7.830603308780586e-06, "1": 1.873026648290268e-07}, "score": 4.048871306417363}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9610289361570145, "4": 0.038608466005212366, "3": 0.0003568116523000693, "2": 4.606035726880546e-06, "1": 1.0843151157551102e-06}, "score": 4.960659751552386}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7889829168644529, "4": 0.20997680641648972, "3": 0.0010292540113185187, "2": 1.0277207282205746e-05, "1": 7.316270114850034e-07}, "score": 4.787930924488852}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9698406377124975, "4": 0.030091732883052565, "3": 6.724788431346687e-05, "2": 3.5173263838331526e-07, "1": 3.3573022307332484e-08}, "score": 4.9697725819727445}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8174790528206448, "4": 0.1805544472285231, "3": 0.0019442344079342658, "2": 2.066826760147538e-05, "1": 1.3855671604751088e-06}, "score": 4.815489497821788}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.71113748455703, "4": 0.2884088175527667, "3": 0.0004481378822599404, "2": 4.333829481474922e-06, "1": 7.109654513182107e-07}, "score": 4.710678912270476}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6098491545611948, "4": 0.3885593709003616, "3": 0.0015883897686834322, "2": 2.7585455273049776e-06, "1": 1.3786746662933317e-07}, "score": 4.608254948667991}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9618449172420938, "4": 0.038049866622596296, "3": 0.00010431921340783382, "2": 6.660460664195168e-07, "1": 9.389957282472473e-08}, "score": 4.9617391159732644}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6962503813645273, "5": 0.28832129875828827, "3": 0.015381795179993442, "2": 4.528650376489746e-05, "1": 9.612599164278021e-07}, "score": 4.27284612235125}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6642003122003032, "5": 0.32629777313502667, "3": 0.00946590862985781, "2": 3.501013384340529e-05, "1": 9.706168885629522e-07}, "score": 4.316758940395776}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5145050543226088, "4": 0.4197217992144017, "2": 0.05914205009748129, "5": 0.00585330979972195, "1": 0.0007775120621592785}, "score": 3.3707314463591724}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.960843119957848, "4": 0.038935525234870046, "3": 0.00021845511235054482, "2": 2.0849159818505316e-06, "1": 6.201639241889651e-07}, "score": 4.960618821472617}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994736772164553, "4": 0.0005232394286977081, "3": 2.815071210189601e-06, "1": 1.374162769775748e-07, "2": 1.014208647693835e-07}, "score": 4.999470276485581}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8769424764835315, "3": 0.11153518247067222, "5": 0.00827686504526809, "2": 0.003174267442597299, "1": 7.100963399909023e-05}, "score": 3.890180096941598}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7201731714417692, "5": 0.2713164845035587, "3": 0.008492923429022137, "2": 1.6703053682801073e-05, "1": 3.750070541823477e-07}, "score": 4.26278911996834}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8242441783677811, "3": 0.17196384977249649, "5": 0.0034694715072807916, "2": 0.0003213325467173133, "1": 1.0570801776282568e-06}, "score": 3.8308597666726727}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.975158780937195, "5": 0.019530860004781648, "3": 0.005307547047941798, "2": 2.708715556013605e-06, "1": 7.87551629594406e-08}, "score": 4.014217659609132}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.568603854987582, "4": 0.43110158094534146, "3": 0.000294088445745083, "2": 4.3417810797177205e-07, "1": 3.928889217026337e-08}, "score": 4.56830878154327}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7227912688196004, "5": 0.2758086364324239, "3": 0.0013964420081607673, "2": 3.389734358387223e-06, "1": 1.4702620511011154e-07}, "score": 4.274405005702218}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6250680969880751, "5": 0.3716085736698814, "3": 0.0033152464971304687, "2": 7.768837645103302e-06, "1": 2.4501828415064436e-07}, "score": 4.368277079849671}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8925705507438627, "4": 0.10726562973467663, "3": 0.00016339793717599097, "2": 2.973107347877626e-07, "1": 2.7607620424378174e-08}, "score": 4.8924065616276655}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7915769926812024, "4": 0.20804330995880507, "3": 0.00037911400248464905, "2": 4.3774862799754176e-07, "1": 2.509626014794075e-08}, "score": 4.7911970232419065}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9087324559639951, "4": 0.09117702796310626, "3": 8.996309745467319e-05, "2": 4.0574132943899974e-07, "1": 4.5497657310334384e-08}, "score": 4.908641637332891}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.691494805386681, "4": 0.3078984063296374, "3": 0.0006056998449271146, "2": 1.025605898016933e-06, "1": 4.7615142811902784e-08}, "score": 4.690886921998249}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8838183004045888, "3": 0.07279412700805594, "5": 0.04332457729652083, "2": 6.254620464691234e-05, "1": 4.0268931614386825e-07}, "score": 3.9704041484380665}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7063694910255528, "3": 0.2906053842419134, "5": 0.0025522695398842374, "2": 0.0004720935938409855, "1": 7.742670476962604e-07}, "score": 3.711000378970262}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5623079361805068, "5": 0.4315264122582279, "3": 0.006160668405110926, "2": 4.719965819615103e-06, "1": 1.780098412965136e-07}, "score": 4.425355806123973}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8876726334367556, "4": 0.112093335730242, "3": 0.00023337592325722102, "2": 4.75456472326341e-07, "1": 1.0470300692979864e-07}, "score": 4.887438058827765}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6839895973690624, "4": 0.31536562467795154, "3": 0.0006437670634548396, "2": 7.842962641745032e-07, "1": 0}, "score": 4.683344416554323}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9517048888039406, "3": 0.042357067020968205, "5": 0.005889515162922649, "2": 4.806107307912466e-05, "1": 2.82530310022573e-07}, "score": 3.963435471625482}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9856608411945497, "4": 0.014321448075090405, "3": 1.7535923669441982e-05, "2": 5.5700985342448984e-08, "1": 1.1941429649628104e-08}, "score": 4.985643263670367}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9438221509532173, "5": 0.04627892523615013, "3": 0.009893087480634704, "2": 5.633751481347175e-06, "1": 9.473711421152072e-08}, "score": 4.036374289963864}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9760547107927682, "4": 0.02393794792367873, "3": 7.226172885843908e-06, "2": 7.040363743502936e-09, "1": 0}, "score": 4.976047576020912}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9262520769992458, "5": 0.04860814351867487, "3": 0.02504577821465203, "2": 9.332943613792646e-05, "1": 6.584132916391728e-07}, "score": 4.023373731505501}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7743757717415262, "5": 0.1896376183163762, "3": 0.035956895684859345, "2": 2.894511810838303e-05, "1": 7.100666486348475e-07}, "score": 4.153620711270111}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994749949541406, "4": 0.005209108245285878, "3": 4.0841248280109895e-05, "2": 1.1692817260817347e-07, "1": 3.570061219459015e-08}, "score": 4.994708715944556}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9897662399471713, "4": 0.010189386903951702, "3": 4.414164014644045e-05, "2": 1.50086656449021e-07, "1": 3.9760495220167576e-08}, "score": 4.989721720085597}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9041072646886005, "4": 0.0953853191200801, "3": 0.0005061168431588272, "2": 1.1627542659540993e-06, "1": 6.573449573546029e-08}, "score": 4.903598689161883}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9732943855835057, "4": 0.026407553297438446, "3": 0.00029595948145098763, "2": 1.7183448963181184e-06, "1": 3.4992289735587727e-07}, "score": 4.972993972112194}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8965236687524124, "3": 0.05976679737885003, "5": 0.04354770391655213, "2": 0.00016055275143776214, "1": 1.2643517724110838e-06}, "score": 3.983456007766936}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9324750666486773, "4": 0.06740900261689138, "3": 0.00011549388189632571, "2": 3.021750051976789e-07, "1": 6.671266646699828e-08}, "score": 4.932358831646411}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9359270439876602, "4": 0.0639113891193942, "3": 0.00016133719568597342, "2": 1.8139044033864167e-07, "1": 2.837464137475122e-08}, "score": 4.935765277539009}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8733050123742718, "4": 0.12634608891497526, "3": 0.00034773286579226987, "2": 1.0711807641731072e-06, "1": 8.55704349120377e-08}, "score": 4.87295488837409}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.624472697092461, "4": 0.37491505450183404, "3": 0.0006108757345006317, "2": 1.243194849847089e-06, "1": 6.159260637441801e-08}, "score": 4.623859192540341}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.890596104608312, "5": 0.10195043654692718, "3": 0.007447988373735977, "2": 5.299643520241859e-06, "1": 9.72366635095949e-08}, "score": 4.094491564129874}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.920909745250023, "3": 0.0733361949510099, "5": 0.004999146905525481, "2": 0.0007510990680900089, "1": 3.5548773358070357e-06}, "score": 3.9301500710988275}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.91654108001086, "4": 0.08337131280101114, "3": 8.738918713038668e-05, "2": 1.4258593020473447e-07, "1": 1.2995054174357106e-08}, "score": 4.916453423871742}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7575161664334573, "5": 0.24100998857043637, "3": 0.0014677180958943253, "2": 5.307046989014985e-06, "1": 2.9330054582095733e-07}, "score": 4.239530902604565}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9809548783895832, "4": 0.019037425006882516, "3": 7.718388185405181e-06, "2": 2.1815720569440115e-08, "1": 0}, "score": 4.980947073600299}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7470027891906491, "5": 0.2497016184848387, "3": 0.0032913768707650342, "2": 4.011035983549781e-06, "1": 1.500223580936388e-07}, "score": 4.246401782878157}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.953087110399508, "4": 0.046731697370493853, "3": 0.0001800941118676582, "2": 9.41400666492014e-07, "1": 1.4497855529218033e-07}, "score": 4.9529047097367025}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.931535052017551, "4": 0.06839069511074763, "3": 7.411274819804859e-05, "2": 7.353679086335152e-08, "1": 1.608308079207426e-08}, "score": 4.931460790988681}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9676919053155196, "4": 0.032233886629405205, "3": 7.371730375229835e-05, "2": 3.1828997455404567e-07, "1": 7.164861592683376e-08}, "score": 4.967617434034128}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9924464177815626, "4": 0.007550385933558643, "3": 3.0967976392575274e-06, "2": 1.6280089155580536e-08, "1": 0}, "score": 4.99244337100213}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "human", "scores": {"4": 0.861195481719102, "5": 0.11182400807898951, "3": 0.026899408001384104, "2": 8.041868566608005e-05, "1": 5.793129526230344e-07}, "score": 4.08476203359978}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9227812559838143, "4": 0.07678290920397395, "3": 0.00042936653924368647, "2": 5.617768707668797e-06, "1": 7.434554441579563e-07}, "score": 4.922338522276069}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5037621232529537, "4": 0.48623885724673405, "3": 0.009971977197261343, "2": 2.660003570192205e-05, "1": 3.5063852059540603e-07}, "score": 4.493735939309173}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7760387301944414, "5": 0.21404964604532514, "3": 0.009761267697039196, "2": 0.00014754387039501266, "1": 2.443334141426441e-06}, "score": 4.203986035847086}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.613367587145437, "5": 0.3672686435258185, "3": 0.019229463863179207, "2": 0.00013143094202400492, "1": 2.8159778090738707e-06}, "score": 4.34776789020549}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8452477747928273, "4": 0.15119003855194713, "3": 0.0035043174974849624, "2": 4.681410554118469e-05, "1": 1.079483261400079e-05}, "score": 4.841617663591817}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7498363921864424, "4": 0.2479834670897618, "3": 0.0021583397221489812, "2": 2.0735880515249133e-05, "1": 9.047248252314425e-07}, "score": 4.747633986446517}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7081421136051984, "4": 0.29133134994121074, "3": 0.0005261332764709388, "2": 3.9910751308500273e-07, "1": 4.01231244206231e-08}, "score": 4.707615036232317}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.921443257502353, "4": 0.07849652678104953, "3": 5.9846596185518775e-05, "2": 2.285533899172865e-07, "1": 4.407504886432578e-08}, "score": 4.921382910480296}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9801062841341796, "4": 0.019882987746234013, "3": 1.067948976912455e-05, "2": 1.698349239905749e-08, "1": 0}, "score": 4.980095601693849}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8647058393524378, "4": 0.12959440076124779, "2": 0.003989449609805221, "5": 0.001698530692789949, "1": 1.1499511520218055e-05}, "score": 3.128979049637428}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9982699150254125, "4": 0.0017279981140623012, "3": 2.0595892257959856e-06, "2": 1.4350199390915471e-08, "1": 0}, "score": 4.998267839634506}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.777546911822298, "4": 0.22168329827432565, "3": 0.0007681529430860266, "2": 1.3353421590996207e-06, "1": 2.3246178291247044e-07}, "score": 4.776775444528499}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986308191845134, "4": 0.0013681968143379668, "3": 9.58973879174131e-07, "2": 5.540035102588391e-09, "1": 0}, "score": 4.998629868591098}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9925522251566262, "4": 0.00744260319153117, "3": 5.181406569703517e-06, "2": 1.065280073022648e-08, "1": 0}, "score": 4.992547002189024}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7402257586902524, "5": 0.25483533181581086, "3": 0.004932129188921911, "2": 6.623649870451689e-06, "1": 1.7373129725380723e-07}, "score": 4.249889429866107}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.538181185227876, "4": 0.4593063786421159, "3": 0.0025092198271285736, "2": 3.0880430031752144e-06, "1": 1.595641182822589e-07}, "score": 4.53566529385379}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7151644948651812, "5": 0.2812583322850347, "3": 0.0035702701992150455, "2": 6.5583140015523026e-06, "1": 2.576862699263184e-07}, "score": 4.277674196459558}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5245269868202098, "5": 0.4743517233846319, "3": 0.00111941281889035, "2": 1.8614179908805453e-06, "1": 5.157643266968577e-08}, "score": 4.4732284159556475}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7828296009363104, "4": 0.2168695626391071, "3": 0.0003002449249183973, "2": 5.306739682711074e-07, "1": 6.085900753227815e-08}, "score": 4.7825281120603655}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9356663731371921, "5": 0.04644027502557397, "3": 0.017865978805621255, "2": 2.7178128700798834e-05, "1": 1.6218632634838384e-07}, "score": 4.028519454336632}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8294922851480603, "5": 0.15616049289129597, "3": 0.014331285990945386, "2": 1.5799346176843734e-05, "1": 1.4676678596641305e-07}, "score": 4.141797166469352}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5812079318567526, "5": 0.41818784393389313, "3": 0.0006037144117961548, "2": 5.093497116623112e-07, "1": 1.6903417779345294e-08}, "score": 4.417583053240852}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8953850891848923, "5": 0.09736119074956856, "3": 0.007206192162486985, "2": 4.684819861839307e-05, "1": 5.946094699023934e-07}, "score": 4.090059526025048}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9304895718517281, "3": 0.040989440263478616, "5": 0.02840723252112848, "2": 0.00011285756737668847, "1": 6.012590281530534e-07}, "score": 3.9871902695472494}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8920329567995118, "5": 0.10322310142171064, "3": 0.004740403596305734, "2": 3.455535914632039e-06, "1": 2.6681563918019807e-08}, "score": 4.098475712220076}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7683856449527062, "5": 0.22986699958297657, "3": 0.0017463978217664806, "2": 8.638730602009734e-07, "1": 0}, "score": 4.228118895405682}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5236576436507219, "4": 0.4754353349693459, "3": 0.0009064542480775433, "2": 6.023085388054311e-07, "1": 2.689713665651245e-08}, "score": 4.522749871645075}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9814720426313883, "4": 0.0185075837215866, "3": 2.0373194831282156e-05, "2": 6.067597598547455e-08, "1": 0}, "score": 4.981451488977885}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9770016774511892, "4": 0.022983541641671996, "3": 1.4710927102706401e-05, "2": 3.5633522460728107e-08, "1": 0}, "score": 4.976986928813136}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7255737048639546, "5": 0.2718390542861918, "3": 0.002582288390796334, "2": 4.725685160584651e-06, "1": 1.756172369948325e-07}, "score": 4.269246801447132}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7384773852686709, "5": 0.24916872538620174, "3": 0.012296027945714633, "2": 5.5777555537731626e-05, "1": 1.8914723708216899e-06}, "score": 4.2367555134573145}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7849803761870738, "4": 0.21443026464988324, "3": 0.000587452597680678, "2": 1.5732862080407147e-06, "1": 2.385349491588253e-07}, "score": 4.784389135728455}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6234637843448095, "5": 0.3749367102207932, "3": 0.0015968489465137774, "2": 2.555210372818821e-06, "1": 7.463800567624637e-08}, "score": 4.373334536884965}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8577758334546932, "4": 0.1419616114260431, "3": 0.00026156702435905485, "2": 8.970152266034246e-07, "1": 6.572588508052918e-08}, "score": 4.857512296963415}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8772460212581511, "5": 0.10812741269898446, "3": 0.014609333115757994, "2": 1.6871647628379454e-05, "1": 1.809626826756284e-07}, "score": 4.093483810256623}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7563981409207268, "4": 0.2430418811696115, "3": 0.0005589846751183973, "2": 8.862444690196997e-07, "1": 6.843071933870931e-08}, "score": 4.755837207609107}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9106701972913556, "4": 0.0890190132538809, "3": 0.0003104784696179286, "2": 1.7183141261813276e-07, "1": 0}, "score": 4.910359501838835}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9994240187409277, "4": 0.0005739245019496156, "3": 1.9597375436286746e-06, "2": 2.983284109734989e-08, "1": 2.0040031277048545e-08}, "score": 4.9994219863370635}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9437208653950573, "4": 0.05622586481106508, "3": 5.2869814305919405e-05, "2": 3.000190092892927e-07, "1": 0}, "score": 4.943667489872266}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7727739154138139, "4": 0.2258374017340807, "3": 0.0013821565253892302, "2": 5.811435172280863e-06, "1": 7.202625778224456e-07}, "score": 4.771377971087249}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6793331933007215, "4": 0.31744623930821037, "3": 0.0032104643338873263, "2": 9.239128453256842e-06, "1": 9.134721031667188e-07}, "score": 4.676101476797268}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.86592515521791, "5": 0.12566465352820608, "3": 0.008402757946971283, "2": 7.25603515650401e-06, "1": 0}, "score": 4.117247404295575}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.881457730571101, "4": 0.11793289532085005, "3": 0.0006040316262857629, "2": 4.056317563466519e-06, "1": 1.0517396029512929e-06}, "score": 4.8808426375820595}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7124765355094057, "5": 0.2855827641364819, "3": 0.0019384311861255275, "2": 2.1661503459465876e-06, "1": 6.005920567518977e-08}, "score": 4.283639832656769}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "human", "scores": {"4": 0.903810363034692, "5": 0.08167874255634851, "3": 0.014491398680693013, "2": 1.908173429710971e-05, "1": 1.6344602883046097e-07}, "score": 4.0671487068929455}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.64413258289911, "5": 0.3464874431895586, "3": 0.009341457403458542, "2": 3.715615949020577e-05, "1": 1.0898439904440475e-06}, "score": 4.337068495113656}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9923853569130731, "4": 0.007589757029580257, "3": 2.464062633948676e-05, "2": 1.4043065903480713e-07, "1": 3.5935757734333305e-08}, "score": 4.992360396155108}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9669372084711432, "4": 0.03302258690431328, "3": 4.000232422153595e-05, "2": 1.0541456737503487e-07, "1": 2.159610203249464e-08}, "score": 4.96689700332682}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8165810306812625, "4": 0.1828932737174395, "3": 0.0005239704858202745, "2": 1.600323918733784e-06, "1": 1.2134440647321914e-07}, "score": 4.816053498327446}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8948155422438213, "4": 0.08278213514405856, "2": 0.022144259076281602, "5": 0.00021663275746465835, "1": 4.120973677664499e-05}, "score": 3.0609887355902003}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7641593792409964, "5": 0.23154987173415784, "3": 0.004289141425447501, "2": 1.470413359151958e-06, "1": 4.977609441476485e-08}, "score": 4.227257660018288}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8183765158126678, "5": 0.17634273846212614, "3": 0.005279226965668482, "2": 1.4157431080785233e-06, "1": 0}, "score": 4.171060697632304}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8565234694647293, "5": 0.13754089333764122, "3": 0.005930708475535461, "2": 4.811681262963769e-06, "1": 4.6684482873610245e-08}, "score": 4.131600430705058}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.821818131189487, "5": 0.17476971253921628, "3": 0.0034088646170704266, "2": 3.05385143008047e-06, "1": 3.641190701491698e-08}, "score": 4.171354665492833}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8992382616325727, "4": 0.06984181359031025, "2": 0.030681859340520708, "5": 0.0001840025392828944, "1": 5.3843654386295855e-05}, "score": 3.0394202806622}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7805212915707059, "3": 0.2160561394945677, "5": 0.0029088862587792162, "2": 0.0005123415835514774, "1": 1.328183949915395e-06}, "score": 3.7858240762805813}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.570337493221847, "4": 0.4290001544632453, "3": 0.000662120761155255, "2": 2.346189800783035e-07, "1": 0}, "score": 4.5696749014765485}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8283614052963315, "5": 0.16393401166925622, "3": 0.00769505780268161, "2": 9.431730198944734e-06, "1": 8.07130955792366e-08}, "score": 4.156219850264697}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.919979266137568, "5": 0.07653093046966469, "3": 0.0034877770295256892, "2": 2.0044015912153024e-06, "1": 0}, "score": 4.073039146241016}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6955067655916702, "5": 0.27509070481733555, "3": 0.029308491284872583, "2": 9.176294417996816e-05, "1": 2.1941847340448855e-06}, "score": 4.245592125026383}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.755463946337285, "4": 0.24217431553442406, "3": 0.0023543208017764534, "2": 6.7694277631270515e-06, "1": 5.809477588836973e-07}, "score": 4.753094394257122}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5165499946726559, "5": 0.48154550281363795, "3": 0.0019020272270565768, "2": 2.3001712069389106e-06, "1": 2.516159298336942e-07}, "score": 4.47963808370383}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9684762847616883, "4": 0.031470845544355155, "3": 5.2568840483285185e-05, "2": 1.5284415950055995e-07, "1": 6.628335679504068e-08}, "score": 4.968423290528135}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.501399946479536, "5": 0.49098318412108327, "3": 0.007596096363711047, "2": 1.98005270882385e-05, "1": 8.592215775253437e-07}, "score": 4.483344963795166}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8598696508511708, "5": 0.130211724934741, "3": 0.009916228713285562, "2": 2.439291328461273e-06, "1": 4.676975984642349e-08}, "score": 4.120290466435979}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8785740706478089, "5": 0.11155954441475127, "3": 0.009838633003274923, "2": 2.7409880702334592e-05, "1": 2.6995353104525036e-07}, "score": 4.101665289119538}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.864179946890198, "3": 0.0774094664739671, "5": 0.058366347306061356, "2": 4.367581681504887e-05, "1": 4.459941507155074e-07}, "score": 3.9808681889676643}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5882051719843092, "5": 0.41068351401955183, "3": 0.0011098464572807769, "2": 1.4321911696170513e-06, "1": 6.270949282812077e-08}, "score": 4.409570603844862}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.794172616682423, "5": 0.19640361046651753, "3": 0.009408547446992967, "2": 1.4769460335047311e-05, "1": 3.3691303374538556e-07}, "score": 4.186964535614272}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9354801238933591, "5": 0.04668598343204207, "3": 0.01780684224070345, "2": 2.6769403047220928e-05, "1": 1.6289581699973438e-07}, "score": 4.0288251171030485}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7710785499489872, "5": 0.21913329091353478, "3": 0.009783191685155351, "2": 4.784418815987053e-06, "1": 9.764923634324252e-08}, "score": 4.209340255317401}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8755101622118074, "3": 0.09502664053591217, "5": 0.02939495552915881, "2": 6.799645408205107e-05, "1": 2.6347772701366835e-07}, "score": 3.934231532849459}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7485180803275222, "3": 0.24019084118918504, "2": 0.0066886334049921035, "5": 0.004574494857554397, "1": 2.7697677307542516e-05}, "score": 3.7509232309237586}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.7904953141928165, "2": 0.142354920449527, "4": 0.06640149551082458, "5": 0.0004448569892149201, "1": 0.0003032906412981021}, "score": 2.9243296985089855}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9903756345302283, "4": 0.009243127283451839, "3": 0.0001908801144544822, "1": 0.00018059312233780088, "2": 6.985898086038702e-06}, "score": 4.98963175349014}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7758444111479137, "4": 0.22236964816441776, "3": 0.0016734816540436867, "1": 7.630733428359451e-05, "2": 3.316193088665351e-05}, "score": 4.773877997345271}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7965080045721363, "4": 0.1944632266238867, "3": 0.008816767259640541, "2": 0.00013618858204931798, "1": 7.524290082362396e-05}, "score": 4.78719358019465}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9744090171651484, "4": 0.02547477836523768, "3": 0.00011135168855325375, "1": 2.2001643408578656e-06, "2": 1.8720583696993863e-06}, "score": 4.974288081355532}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7389455066963245, "4": 0.2568009520020784, "3": 0.00412217641100503, "2": 0.00010276045067784183, "1": 2.754446362252809e-05}, "score": 4.7345359545837935}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7434783295822274, "5": 0.25116635260396813, "3": 0.005346831160529841, "2": 8.313769016459353e-06, "1": 2.0315085618005427e-07}, "score": 4.245802277013238}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9906535392439899, "4": 0.009329974474301433, "3": 1.631422714280441e-05, "2": 8.704070100895032e-08, "1": 2.745449308147845e-08}, "score": 4.990637025592412}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9886121382133494, "4": 0.011365332109218645, "3": 2.2232975239720702e-05, "2": 1.3499123318324564e-07, "1": 3.15507965831684e-08}, "score": 4.988589669278245}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9029372577351625, "4": 0.09695230717505468, "3": 0.00011005514495686047, "2": 2.7209787522217317e-07, "1": 2.4371583353501658e-08}, "score": 4.902826660643493}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6420346338117341, "4": 0.3556454753792809, "3": 0.0023103066831322086, "2": 9.233309635451345e-06, "1": 1.3326489470463991e-07}, "score": 4.639705599883445}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5676265834284865, "4": 0.43186953442333503, "3": 0.0005027284472233573, "2": 8.707934756303469e-07, "1": 0}, "score": 4.567122273837445}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8953424618109128, "3": 0.05809634069396184, "5": 0.04594378936654583, "2": 0.0006122431808782907, "1": 4.9325769429124675e-06}, "score": 3.986608161468127}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9171071271944436, "4": 0.08265150050082387, "3": 0.00024015668343230304, "2": 9.943515706674527e-07, "1": 1.0707396281714434e-07}, "score": 4.916864765288056}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8938247250690908, "3": 0.05294995800721016, "5": 0.052116024788535796, "2": 0.0010984971067081707, "1": 1.045889233761776e-05}, "score": 3.996937694861545}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5213626052205382, "4": 0.4774274011962936, "3": 0.0012088915664484419, "2": 1.0316304975788985e-06, "1": 0}, "score": 4.520151687004608}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7283777339744589, "5": 0.25800866741320005, "3": 0.013528577216709959, "2": 8.138480281421627e-05, "1": 3.5296282647519286e-06}, "score": 4.24430675783823}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9856071093584008, "4": 0.014365317276807212, "3": 2.7295846778565095e-05, "2": 1.1182988547566171e-07, "1": 7.467264574675509e-08}, "score": 4.985579455536904}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8770568196974876, "4": 0.12257765885768841, "3": 0.00036518809804965955, "2": 3.1517714219788463e-07, "1": 4.831793597409977e-08}, "score": 4.876690829860605}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.948117541015565, "4": 0.05182090187526036, "3": 6.128324991973216e-05, "2": 1.88603482860653e-07, "1": 3.982758795839395e-08}, "score": 4.94805580414437}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9344540724034845, "4": 0.06539146065948502, "3": 0.00015346914820968142, "2": 7.9904705543849e-07, "1": 8.804929577928562e-08}, "score": 4.9342988444331235}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7592504669816234, "4": 0.23546831926241749, "3": 0.005208694658510816, "2": 6.045640688511267e-05, "1": 1.1947494103839687e-05}, "score": 4.753885103871925}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6250162372394994, "5": 0.37141052193463847, "3": 0.0035525536360250937, "2": 1.9643010159600576e-05, "1": 8.288994333218227e-07}, "score": 4.367816274763572}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6871242460877656, "4": 0.3122343660265465, "3": 0.0006409103310413933, "2": 4.1175513368515913e-07, "1": 3.948969836262579e-08}, "score": 4.686482411838586}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5013343877088602, "5": 0.4979284933090604, "3": 0.0007352874843902862, "2": 1.7386910464355578e-06, "1": 1.195895947060743e-07}, "score": 4.497189356357594}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8148744635984678, "4": 0.18490596138101553, "3": 0.00021886750745878414, "2": 5.342173811584856e-07, "1": 0}, "score": 4.814654668832379}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.638980992975028, "5": 0.35897088286814915, "3": 0.002044485725677086, "2": 3.5240417592609836e-06, "1": 1.3180714571462114e-07}, "score": 4.356918947420788}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.751007365256836, "4": 0.24878368376256826, "3": 0.00020847091976539987, "2": 5.127292032786435e-07, "1": 3.4513440812879024e-08}, "score": 4.75079771489839}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8116611734336588, "5": 0.1854956958813116, "3": 0.0028402207527167132, "2": 2.7337397893409867e-06, "1": 7.441159950011704e-08}, "score": 4.182649803004483}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8377890587965415, "5": 0.1611734926638689, "3": 0.0010364909058805639, "2": 9.092943298179646e-07, "1": 3.100671633376086e-08}, "score": 4.160135092924747}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6897006611087285, "5": 0.3090597670234242, "3": 0.0012360191828029025, "2": 3.4201710278392296e-06, "1": 1.4648277385652496e-07}, "score": 4.307816463750431}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "human", "scores": {"4": 0.862718153900493, "3": 0.1235121681793044, "5": 0.013103878813083511, "2": 0.0006619033563971068, "1": 3.946624110686118e-06}, "score": 3.8882560697334445}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7642607593486404, "5": 0.23110930466659604, "3": 0.004621796946735007, "2": 7.794961457363377e-06, "1": 1.9050888558054522e-07}, "score": 4.226471381048975}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5077318119701273, "4": 0.4911840520505884, "3": 0.0010834845461365561, "2": 6.272297098569272e-07, "1": 2.4293524587308266e-08}, "score": 4.506647000038355}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9494269318835392, "4": 0.050477060168226215, "3": 9.550929360278489e-05, "2": 3.728912555086449e-07, "1": 8.842270998617043e-08}, "score": 4.949330446987927}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6935515561703975, "4": 0.30535788402900216, "3": 0.001087561440049572, "2": 2.8243706413738254e-06, "1": 2.2136321006817436e-07}, "score": 4.692457649095432}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8645482092000786, "3": 0.09357588196646449, "5": 0.041812225756629275, "2": 6.34381590383664e-05, "1": 1.4195552963189387e-07}, "score": 3.948109036262688}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945188008900375, "4": 0.00547831175166829, "3": 2.8800180398477875e-06, "2": 4.124731129547004e-09, "1": 1.700958366038625e-09}, "score": 4.99451590902592}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5113522968513529, "4": 0.4876715270841773, "3": 0.0009758594383566342, "2": 2.9439777731538385e-07, "1": 1.1121296090665605e-08}, "score": 4.510375820922317}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9986632700204955, "4": 0.0013350707396925792, "3": 1.6248939595067037e-06, "2": 1.6462578524287574e-08, "1": 5.448175799440777e-09}, "score": 4.998661608275306}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8468102884466051, "4": 0.15311241328756722, "3": 7.716103163044407e-05, "2": 1.0782373785241551e-07, "1": 4.322015467868012e-09}, "score": 4.846732920044665}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9931467156019423, "4": 0.00682577084477133, "3": 2.737298444823445e-05, "2": 9.48701236670748e-08, "1": 5.6136646634107494e-08}, "score": 4.9931189741012}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9933060681486545, "4": 0.006673061692575008, "3": 2.0800843899264556e-05, "2": 6.096749400321935e-08, "1": 0}, "score": 4.993285153661093}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9780243661440058, "4": 0.02192329080949579, "3": 5.2216448883632416e-05, "2": 7.248276699215792e-08, "1": 2.0572265566356254e-08}, "score": 4.977971975816497}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967496244452763, "4": 0.0032423821105942788, "3": 7.866754259347434e-06, "2": 7.185540507797043e-08, "1": 0}, "score": 4.996741668636003}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.56475577382683, "5": 0.4340733716800505, "3": 0.00116922750543455, "2": 1.4789458314864557e-06, "1": 5.1909189541065445e-08}, "score": 4.432901072171316}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7934090534612273, "4": 0.20651017379959882, "3": 8.063675459893583e-05, "2": 4.4525133921191154e-08, "1": 5.219631663966691e-09}, "score": 4.793328380413954}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7922574792010028, "5": 0.20460102821264303, "3": 0.0031395901909995103, "2": 1.8548847374146813e-06, "1": 3.222426811801562e-08}, "score": 4.201457634658917}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.849708516562534, "4": 0.1498663622983811, "3": 0.0004246135911094628, "2": 4.132037600135308e-07, "1": 4.691881824840292e-08}, "score": 4.849282976085033}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8925550737046991, "4": 0.10738824001174112, "3": 5.6531135545178026e-05, "2": 1.0747549165239765e-07, "1": 1.789187746483557e-08}, "score": 4.892498300521715}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6295382278615156, "4": 0.36995799752147634, "3": 0.0005033181916955405, "2": 5.2661294919223e-07, "1": 2.0798603331867607e-08}, "score": 4.629033736814696}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7359328726877791, "4": 0.26352645962708626, "3": 0.0005396374676878548, "2": 9.094652932220265e-07, "1": 1.1595217677817521e-07}, "score": 4.7353910719628365}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9480458470778953, "4": 0.05191630896116666, "3": 3.764512854517754e-05, "2": 9.8007679411901e-08, "1": 1.1150695101964928e-08}, "score": 4.948008057493598}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8064509513042597, "4": 0.1933357044090973, "3": 0.00021281144905369536, "2": 4.4955708249829176e-07, "1": 4.449856034924072e-08}, "score": 4.806237138512805}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9887024401927678, "4": 0.01129216225129404, "3": 5.294460355334288e-06, "2": 1.0866436700461576e-08, "1": 0}, "score": 4.988697215186239}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9001600663243718, "4": 0.09966216126303869, "3": 0.00017728020465309946, "2": 4.1371231333452385e-07, "1": 3.9492936650659483e-08}, "score": 4.899981875317992}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7448557377182444, "3": 0.24731031372672643, "5": 0.0073370311034452315, "2": 0.0004943681872837561, "1": 2.2452650081888257e-06}, "score": 3.759031171952774}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8913910401109045, "3": 0.07862068863468567, "5": 0.02970430482720105, "2": 0.0002826477882280202, "1": 1.181517415815785e-06}, "score": 3.95051476927832}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.629300055661115, "4": 0.3666028754664337, "3": 0.004092695825567406, "2": 4.321322795139974e-06, "1": 4.411027890089377e-08}, "score": 4.625198589619264}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982794129100478, "4": 0.001719886463377075, "3": 7.105660009906252e-07, "1": 0, "2": 0}, "score": 4.99827869242173}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8709578551845686, "3": 0.11709578545696285, "5": 0.010093550736798877, "2": 0.0018455148295641651, "1": 7.116169278564837e-06}, "score": 3.8892853674474264}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8708272909702574, "5": 0.11840747796955509, "3": 0.010758566048471448, "2": 6.5501670816080755e-06, "1": 4.3093054556641517e-08}, "score": 4.107635690030787}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9007068275052075, "5": 0.057735768087203335, "3": 0.04151672171539758, "2": 4.0484596076133555e-05, "1": 2.5961969195626625e-07}, "score": 4.016137297327754}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.785291415619527, "4": 0.21440273357143527, "3": 0.000305713551696295, "2": 1.1233144561697709e-07, "1": 1.185964946362959e-08}, "score": 4.784985452082804}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9532066779114885, "4": 0.046727575816548975, "3": 6.551987671895897e-05, "2": 2.0908457536896264e-07, "1": 1.910828168110465e-08}, "score": 4.953140680827397}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5122462359307167, "5": 0.48695746528068495, "3": 0.0007930208849842505, "2": 3.0381979436644468e-06, "1": 2.372607712655276e-07}, "score": 4.486157657406107}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9321342720036466, "3": 0.05917729743006708, "5": 0.008583106225977221, "2": 0.00010464603478953574, "1": 4.860015615428248e-07}, "score": 3.9491950489516534}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8379490666509636, "4": 0.16180866856328754, "3": 0.00024167710490503424, "2": 5.008210426360627e-07, "1": 3.35997906718877e-08}, "score": 4.83770633172085}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5205455930743033, "4": 0.4778271130956532, "3": 0.0016257604555814285, "2": 1.3968372278156416e-06, "1": 8.389917975341536e-08}, "score": 4.5189168145615}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8928770406743951, "4": 0.10700935697276674, "3": 0.00011317502995089083, "2": 3.193580339694644e-07, "1": 0}, "score": 4.892763323315438}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9161289949880911, "3": 0.06057157229581749, "5": 0.02179884265100122, "2": 0.0014869393487435703, "1": 1.3503778807786085e-05}, "score": 3.9582128741811755}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8769883242346519, "5": 0.12022563621055178, "3": 0.002782495756174788, "2": 3.4744721144421103e-06, "1": 5.3935065753224323e-08}, "score": 4.11743603151246}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6752728821181236, "4": 0.32394753672148036, "3": 0.0007782939323960199, "2": 1.1193034340749637e-06, "1": 1.0042757660725805e-07}, "score": 4.674492093822315}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.505403600496598, "5": 0.49277774405930014, "3": 0.0018177394687761068, "2": 7.866558324492344e-07, "1": 1.3156642234045195e-07}, "score": 4.490958035476444}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.994215987184239, "4": 0.0057802230909067935, "3": 3.754516660279563e-06, "1": 1.9794316221016935e-08, "2": 0}, "score": 4.994212188609296}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.98758698303496, "4": 0.012401712637262542, "3": 1.1225472855630397e-05, "2": 3.566485809696553e-08, "1": 1.0562287107174708e-08}, "score": 4.987575686767925}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8255805691174559, "5": 0.17038702701946934, "3": 0.004030020968239438, "2": 2.2080671894673974e-06, "1": 0}, "score": 4.166352618999888}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5677361459315297, "4": 0.43118489075254535, "3": 0.001076813243724122, "2": 2.0942208145521042e-06, "1": 1.0326988839236034e-07}, "score": 4.5666548075665885}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9092871300864493, "5": 0.08375206934376035, "3": 0.006955309181706881, "2": 5.2031882253432994e-06, "1": 9.430043824206828e-08}, "score": 4.076786085773065}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6683141510448546, "4": 0.33117663680727666, "3": 0.0005086090048306381, "2": 5.405428092234133e-07, "1": 3.125751530240644e-08}, "score": 4.667804388112661}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9098487882833991, "5": 0.08512189422953131, "3": 0.005023575237833901, "2": 5.6312168635123485e-06, "1": 9.172700574545153e-08}, "score": 4.080086782923058}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8280281231638077, "5": 0.16749221607346998, "3": 0.00447329949764532, "2": 5.8539728942548285e-06, "1": 4.5247514657996807e-07}, "score": 4.163005860140094}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9905772559147216, "4": 0.009402801520629505, "3": 1.964688021378984e-05, "2": 1.8043251629905428e-07, "1": 6.6256649984036e-08}, "score": 4.990557097932137}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8893459180357425, "5": 0.10485466819726381, "3": 0.005794123874929262, "2": 5.187389364293483e-06, "1": 9.75759292969903e-08}, "score": 4.0990498773038135}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9765958410157359, "4": 0.02336620105798568, "3": 3.744557546902789e-05, "2": 3.7858811145427434e-07, "1": 1.1252212139609923e-07}, "score": 4.97655732144032}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8533835280269475, "4": 0.14650327438850672, "3": 0.00011294653418810139, "2": 2.0486963232122734e-07, "1": 0}, "score": 4.853270211158131}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7980461109949671, "3": 0.1939969774877945, "5": 0.007584936788251147, "2": 0.00036869824968355805, "1": 3.0122899130077564e-06}, "score": 3.8128414764860543}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8245591162812618, "4": 0.17490736291285788, "3": 0.000531956414292782, "2": 1.3205410750676018e-06, "1": 1.6338785240021632e-07}, "score": 4.824024094924432}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7387939275743859, "5": 0.2564903081693488, "3": 0.004713139653163103, "2": 2.3847577764942583e-06, "1": 7.157285177748546e-08}, "score": 4.251772226648414}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8329768735881731, "4": 0.16688064878558928, "3": 0.0001422660018852208, "2": 1.9648986196922402e-07, "1": 2.054740872627403e-08}, "score": 4.832834148456273}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.957680441527953, "4": 0.04225802510087105, "3": 6.13107109665114e-05, "2": 1.1141587668435136e-07, "1": 4.4493309828906286e-08}, "score": 4.957618838427341}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7971247164999148, "5": 0.17564292149511024, "3": 0.02717059382161636, "2": 6.051925373515122e-05, "1": 1.2230950323320665e-06}, "score": 4.148347623713428}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7686906393104084, "4": 0.23045264092964182, "3": 0.0008277168753799865, "2": 2.686156777985902e-05, "1": 1.8659280774221204e-06}, "score": 4.767803812959739}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9615725882529805, "4": 0.03828467474798838, "3": 0.00014228307482980307, "2": 2.7154390444043737e-07, "1": 8.418214439529633e-08}, "score": 4.961429603954519}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9550021759713225, "4": 0.0449125056833404, "3": 8.500674089256418e-05, "2": 1.6803139500035465e-07, "1": 6.480053353871066e-08}, "score": 4.954916713987232}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9206888031484362, "5": 0.05234829036411079, "3": 0.026854848420729494, "2": 0.00010581227758986302, "1": 1.4950319202675934e-06}, "score": 4.025277351269594}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6220161263321663, "3": 0.23336463304070523, "5": 0.14236155434338846, "2": 0.0022420274743810632, "1": 1.5356050380442433e-05}, "score": 3.9044667692792365}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8143334444023052, "5": 0.10858223139674274, "3": 0.07489748253788446, "2": 0.0021844600449271445, "1": 2.3228678347607116e-06}, "score": 4.029308861887405}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.998335843646352, "4": 0.0016586630378618767, "3": 5.486779975093906e-06, "2": 1.926453492671132e-08, "1": 1.1180339533029198e-08}, "score": 4.998330260927146}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.999090261762975, "4": 0.000908875897054663, "3": 8.266693834743389e-07, "2": 6.926300532351924e-09, "1": 5.057052668163467e-09}, "score": 4.999089429735497}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9255383507089884, "4": 0.07433700520748707, "3": 0.00012412803310577587, "2": 4.7459169122430905e-07, "1": 2.582744889272139e-08}, "score": 4.925413210475546}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8423002052355328, "5": 0.14042191638000664, "3": 0.01726960947485823, "2": 8.19715020560904e-06, "1": 6.60776018505595e-08}, "score": 4.123135715071563}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9766000491762813, "4": 0.023336192439173967, "3": 6.350232744882003e-05, "2": 1.6037949280988216e-07, "1": 2.827621061846412e-08}, "score": 4.976536207081115}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7785970520747624, "4": 0.22001586975090714, "3": 0.001385724737542659, "2": 1.263938396972075e-06, "1": 5.0589641249499444e-08}, "score": 4.777208677931721}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9987948997172492, "4": 0.0012044045301865234, "3": 6.772048668422164e-07, "1": 0, "2": 0}, "score": 4.998794241037716}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7247652787465212, "4": 0.27385752214730436, "3": 0.001374248833569396, "2": 2.8196917147524444e-06, "1": 1.278212542685707e-07}, "score": 4.723385009062039}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6627980205041805, "5": 0.3353494354174189, "3": 0.0018509423337166166, "2": 1.5580726208759224e-06, "1": 4.778729632647147e-08}, "score": 4.33349523220416}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9702436727614419, "5": 0.021524664829695606, "3": 0.008218134846331224, "2": 1.3046045460045178e-05, "1": 3.968706214211252e-07}, "score": 4.013279248404622}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6870356059066356, "4": 0.3123381699810752, "3": 0.0006252862581774057, "2": 8.248980780510044e-07, "1": 5.0940731880364014e-08}, "score": 4.6864085595979414}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9879064825536041, "4": 0.012079759447018796, "3": 1.3633793923970284e-05, "2": 4.995785934424618e-08, "1": 1.8591636646650937e-08}, "score": 4.987892748051169}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7796319497141376, "4": 0.22007732876568048, "3": 0.0002902224093878042, "2": 3.809441730437995e-07, "1": 5.591931437024945e-08}, "score": 4.779340846170329}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8360225270737608, "3": 0.1581699327788303, "5": 0.00576496613222981, "2": 4.240844674004707e-05, "1": 1.8539725309958674e-07}, "score": 3.8475096632918633}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6111359869549354, "5": 0.38010040024054437, "3": 0.008734578418858887, "2": 2.828618599141321e-05, "1": 8.012290305295143e-07}, "score": 4.371306826072448}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8769533944853282, "5": 0.09074693323154354, "3": 0.03229170799927521, "2": 8.053369360530255e-06, "1": 4.650295397624294e-08}, "score": 4.058438971061035}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6589776764101898, "5": 0.3388246710282102, "3": 0.002194037116495194, "2": 3.4249420708964416e-06, "1": 1.7703913980077825e-07}, "score": 4.336623257442414}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8967488867481099, "3": 0.08093106791679924, "5": 0.022224206527928225, "2": 9.536575559284699e-05, "1": 4.124528255560108e-07}, "score": 3.9411011661722712}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7458672229062616, "5": 0.25137576189095767, "3": 0.0027509169129109586, "2": 5.87216598412679e-06, "1": 1.9093457630728559e-07}, "score": 4.248612536590853}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9655247751575151, "3": 0.018250854100889228, "5": 0.01608989248662273, "2": 0.0001325267561123911, "1": 1.6396659924673217e-06}, "score": 3.9975690651174864}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.868757942238403, "5": 0.10912466878674387, "3": 0.022048277457104578, "2": 6.851670320582654e-05, "1": 5.323972051338478e-07}, "score": 4.0869377661580355}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9764481713582417, "4": 0.023536567580379836, "3": 1.5119715553334484e-05, "2": 3.775594085465737e-08, "1": 1.5674353426285426e-08}, "score": 4.9764330149513745}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9530849440349681, "3": 0.04232772374214312, "5": 0.0033047878445770606, "2": 0.0012487490359672586, "1": 3.3449557505923524e-05}, "score": 3.958379202966141}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5901703529171856, "5": 0.40313576012716634, "3": 0.006670543087202735, "2": 2.1930657811936753e-05, "1": 1.1837892922101977e-06}, "score": 4.3964178953031885}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996939014577211, "4": 0.0003046402456499972, "3": 1.3270329134772167e-06, "1": 0, "2": 0}, "score": 4.999692705648186}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9931580044668731, "4": 0.0068054126873027514, "3": 3.611313169158329e-05, "2": 3.131332556830481e-07, "1": 0}, "score": 4.993121420572494}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5477801273559713, "4": 0.4505486574986565, "3": 0.0016643420480247988, "2": 6.444548360364067e-06, "1": 1.7737086747070905e-07}, "score": 4.5461025012676215}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9729818973050391, "3": 0.016755674532896933, "5": 0.010089631162923222, "2": 0.0001701222945223862, "1": 2.198761083695031e-06}, "score": 3.9929871124199923}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8257906565636537, "4": 0.17218694549427777, "3": 0.0020198096594576946, "2": 2.3615957551228883e-06, "1": 9.621351505550134e-08}, "score": 4.823765942551636}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7118296299366048, "4": 0.28791251855685757, "3": 0.00025734396054645655, "2": 4.321137384094816e-07, "1": 3.168907033182591e-08}, "score": 4.711571357807766}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7761298347282548, "4": 0.22294416946747447, "3": 0.0009254134012691534, "2": 4.849180157444078e-07, "1": 2.9011109329177573e-08}, "score": 4.775203417538809}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6555034058415777, "4": 0.3422231394990368, "3": 0.0022700282559754916, "2": 3.1045244826227087e-06, "1": 1.2089940509193644e-07}, "score": 4.65322693712366}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9683825921188807, "5": 0.025380467420045984, "3": 0.006224665332026773, "2": 1.2198116541346668e-05, "1": 7.341974001126275e-08}, "score": 4.01913118566445}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9933945266879264, "4": 0.006551617586850698, "3": 5.339384931494919e-05, "2": 3.5041751268823493e-07, "1": 1.0555802871826596e-07}, "score": 4.9933401211905695}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9982926071564137, "4": 0.0016552917528162999, "3": 5.165756017113793e-05, "2": 2.8291566139243437e-07, "1": 1.9415694696053293e-07}, "score": 4.9982397678111115}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8511522834015166, "4": 0.1432795158906065, "3": 0.00554408602743955, "2": 2.2917104610315264e-05, "1": 1.1765066222771248e-06}, "score": 4.845558851460242}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903766892808408, "4": 0.00955051021750364, "3": 7.2347692425359e-05, "2": 3.260047125530447e-07, "1": 7.688223510971227e-08}, "score": 4.990303508370497}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.827765108690106, "4": 0.17095163478502917, "3": 0.0012760252574699443, "2": 6.765198192653543e-06, "1": 5.149703555388084e-07}, "score": 4.826473967709654}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7037581632153413, "5": 0.2870128473324039, "3": 0.009216711272509477, "2": 1.1732790843807127e-05, "1": 3.3413758421555323e-07}, "score": 4.2777717267450965}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9300192817362788, "5": 0.059809456205506525, "3": 0.010087038460890829, "2": 8.355361803754113e-05, "1": 5.05389711167648e-07}, "score": 4.0495538024954465}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7928993884394661, "5": 0.19869629019125373, "3": 0.008396701742015756, "2": 7.3836164906390044e-06, "1": 7.561176077901888e-08}, "score": 4.19028462490244}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9278215536608693, "4": 0.07210210785204901, "3": 7.612087656767214e-05, "2": 2.1077239128298676e-07, "1": 1.0181433707837852e-08}, "score": 4.927744977593477}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9660066603704128, "4": 0.03396431378958179, "3": 2.887134434233476e-05, "2": 1.0083120054370507e-07, "1": 0}, "score": 4.9659776392023405}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8794733293949767, "5": 0.11320604653719883, "3": 0.007317997895234624, "2": 2.5248257689847574e-06, "1": 1.4920346777218187e-08}, "score": 4.105882963380477}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.994744524587874, "4": 0.005248310834287004, "3": 7.17168445487348e-06, "2": 1.6949355965118944e-08, "1": 0}, "score": 4.994737295075335}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9762455491187167, "4": 0.02372727852759067, "3": 2.7028545762301074e-05, "2": 4.628735607880915e-08, "1": 1.2718426366665747e-08}, "score": 4.976218472628387}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9954527893108831, "4": 0.004545408392745043, "3": 1.7689374541952714e-06, "2": 3.9650078580811e-09, "1": 2.429350255294677e-09}, "score": 4.995451031997261}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9421650136695828, "4": 0.05768813264607515, "3": 0.00014665583129254306, "2": 1.2654662748177955e-07, "1": 1.4847608922231638e-08}, "score": 4.942018113387432}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5795353309912379, "5": 0.37301321164716644, "3": 0.04720338371891945, "2": 0.00024016364807710934, "1": 7.4881034758068645e-06}, "score": 4.325307173565875}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9032608074097054, "4": 0.09647212234402011, "3": 0.00026650647985528334, "2": 4.199941728214027e-07, "1": 1.0894953974777454e-07}, "score": 4.902993165537552}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7340003305699085, "4": 0.26504596903053523, "3": 0.0009529634572581313, "2": 7.242190029784028e-07, "1": 6.772618174215906e-08}, "score": 4.733045675176471}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9460028218562335, "4": 0.05386879560360967, "3": 0.0001274067287865476, "2": 6.933755953119312e-07, "1": 1.9028650110000532e-07}, "score": 4.945873544678313}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7963954022304971, "5": 0.19675243807905576, "3": 0.006823677701853111, "2": 2.804867960525407e-05, "1": 4.754174864940517e-07}, "score": 4.189871228770341}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9459775393226686, "3": 0.03540836455108192, "5": 0.018584131640490956, "2": 2.9686386032179763e-05, "1": 2.018084210933299e-07}, "score": 3.983115787603963}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.992823003533575, "4": 0.007165020905365339, "3": 1.1832589633491293e-05, "2": 5.035988053465221e-08, "1": 1.3975081305462374e-08}, "score": 4.992811106370093}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9962628558699929, "4": 0.003732014913090749, "3": 5.149314288590988e-06, "2": 9.002747755859845e-09, "1": 0}, "score": 4.996257659558991}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.986876293766568, "4": 0.013111651717658102, "3": 1.1874384986443897e-05, "2": 4.355174785543971e-08, "1": 6.43301829880741e-09}, "score": 4.986864441415511}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5844709499438511, "5": 0.41431600467619245, "3": 0.0012114738533350244, "2": 1.4339710561304407e-06, "1": 2.967027897774954e-08}, "score": 4.413101618437494}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8521704955710478, "5": 0.13720360342563576, "3": 0.010619004561503168, "2": 6.592011637244293e-06, "1": 1.998729344609073e-07}, "score": 4.126570828455952}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5509462084017859, "4": 0.44743280901186716, "3": 0.0016156474577757312, "2": 5.041519667500261e-06, "1": 2.3209431911240692e-07}, "score": 4.549319815412897}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7729950144711921, "4": 0.22651729032428639, "3": 0.0004873956703344731, "2": 2.553243855565945e-07, "1": 2.98746363247188e-08}, "score": 4.772507029602194}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9094655497237665, "4": 0.09039172078633997, "3": 0.00014214086287280285, "2": 4.047780276366798e-07, "1": 7.64432654011269e-08}, "score": 4.909322467641484}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8607060312272292, "5": 0.1354064476989502, "3": 0.003881137493052064, "2": 6.258224745822228e-06, "1": 1.0734069451327105e-07}, "score": 4.131512474103563}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8112891039743301, "3": 0.18647072923825772, "5": 0.0021355757425797176, "2": 0.0001042979344588252, "1": 2.435077664160394e-07}, "score": 3.815455510958217}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7966366032045968, "4": 0.20244423764723687, "3": 0.0009177932597048001, "2": 1.3155364878271258e-06, "1": 4.8238470069867065e-08}, "score": 4.795716035838254}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7077922079227852, "4": 0.2919838168489116, "3": 0.00022389911209486706, "2": 1.2543827901819643e-07, "1": 1.0389917211098353e-08}, "score": 4.70756798451409}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8244023907352993, "5": 0.17455320222437012, "3": 0.0010430175256381728, "2": 1.387047736689463e-06, "1": 1.4899502705824379e-08}, "score": 4.173507363747611}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9705363161810266, "4": 0.029431345474317836, "3": 3.21903931277186e-05, "2": 8.908463179557248e-08, "1": 1.7195433200161008e-08}, "score": 4.970503936474655}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8442026977583127, "4": 0.15534839107060933, "3": 0.00044745839349590147, "2": 1.1740714242921082e-06, "1": 2.875347829077579e-07}, "score": 4.843752021168449}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5779916250197167, "4": 0.4204902443319892, "3": 0.0015159231282601592, "2": 1.953923803973223e-06, "1": 1.7698143444768659e-07}, "score": 4.576471307265776}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9669550273542036, "4": 0.03296976993279618, "3": 7.502403718318227e-05, "2": 8.966556789920265e-08, "1": 6.610840118871026e-08}, "score": 4.966879647804012}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9773129929354472, "4": 0.022648501232342067, "3": 3.827219134655141e-05, "2": 1.4930210998241848e-07, "1": 3.2418357016745495e-08}, "score": 4.977274375625283}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9096275890828633, "4": 0.09028032744911521, "3": 9.157429023234273e-05, "2": 3.7825396569892206e-07, "1": 5.377850418956634e-08}, "score": 4.909535167115568}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7863118181657567, "5": 0.21096635778405343, "3": 0.0027203383854408226, "2": 1.3909480401974322e-06, "1": 1.2543263442264496e-07}, "score": 4.208242854808257}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.970975214270124, "4": 0.02901266268461426, "3": 1.2048757685276352e-05, "2": 3.297289422910124e-08, "1": 1.9002448455567358e-08}, "score": 4.9709630642236595}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8814775459636084, "4": 0.1182425329386626, "3": 0.00027841938552881077, "2": 9.913065663013108e-07, "1": 4.988284938363176e-07}, "score": 4.881195657681191}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9989820008130994, "4": 0.0010172060263341214, "3": 7.515027262616116e-07, "2": 6.552219432746684e-09, "1": 0}, "score": 4.998981271275792}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5327884702027285, "5": 0.46652161283673893, "3": 0.0006887515135278247, "2": 1.0525308085887464e-06, "1": 7.804174196522593e-08}, "score": 4.465830538381953}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "human", "scores": {"4": 0.882474875736803, "5": 0.09316787551714191, "3": 0.024322379144587344, "2": 3.4273983162065915e-05, "1": 4.419274979989337e-07}, "score": 4.068775633193919}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9939849665848947, "4": 0.006004739529467588, "3": 1.008403578453514e-05, "2": 1.2300682442291437e-07, "1": 0}, "score": 4.993974722855236}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8451878234943592, "4": 0.15418957918505288, "3": 0.000622213423176951, "2": 3.533923231966739e-07, "1": 0}, "score": 4.8445649290500645}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8550692663943962, "4": 0.14481183050288315, "3": 0.00011856941361283845, "2": 2.80931350986089e-07, "1": 2.3271858407846423e-08}, "score": 4.854950090511477}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9451676989746381, "4": 0.05479063465990478, "3": 4.135902092791163e-05, "2": 2.3381935661422963e-07, "1": 2.582339430153893e-08}, "score": 4.9451258399289975}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9145637256329996, "4": 0.0851735448346157, "3": 0.0002626595108769103, "2": 1.2215159275387517e-07, "1": 1.1645092387256158e-08}, "score": 4.914300728573969}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8907536471799493, "4": 0.10871933780363581, "3": 0.0005259754601616275, "2": 9.320503501070861e-07, "1": 5.82070124869964e-08}, "score": 4.890225676885188}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.797263213007063, "5": 0.20023391917570188, "3": 0.0025008380081901213, "2": 2.0726594848804506e-06, "1": 2.639548141410677e-08}, "score": 4.197728842970182}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9889363750871362, "4": 0.01105453199286369, "3": 9.005941786168705e-06, "2": 3.715130271666539e-08, "1": 7.766377480550204e-09}, "score": 4.988927313138424}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9921043893838126, "4": 0.007890841467009111, "3": 4.7442319695706025e-06, "2": 1.6237880854212112e-08, "1": 4.4369040045452105e-09}, "score": 4.992099603574276}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9069369555935388, "3": 0.06866054866099708, "5": 0.024292821106476868, "2": 0.00010856787549268264, "1": 9.325025041653833e-07}, "score": 3.95541233141709}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.852638559409377, "5": 0.09325826422391253, "3": 0.05406420268686755, "2": 3.82557378420294e-05, "1": 6.15570719671092e-07}, "score": 4.0391157073535275}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8444881625020663, "4": 0.15479566842014758, "3": 0.0007155512022734074, "2": 4.91099049182806e-07, "1": 4.386351306162513e-08}, "score": 4.843771567470745}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6470349612539081, "4": 0.3523750808869366, "3": 0.0005886245581785678, "2": 1.1725836451774056e-06, "1": 1.1134526140594232e-07}, "score": 4.646443689408918}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9468074772332224, "4": 0.05304939597200855, "3": 0.0001427101368378309, "2": 2.4148680573113394e-07, "1": 0}, "score": 4.94666444995105}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9673617058354642, "4": 0.03261223350867416, "3": 2.6021485390971673e-05, "2": 4.0585093213026916e-08, "1": 0}, "score": 4.96733560181147}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9590680090320233, "4": 0.04066062904685945, "3": 0.00027076967668148333, "2": 4.809502512232337e-07, "1": 6.506428862987542e-08}, "score": 4.958796126587019}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5812052931787318, "5": 0.41555094952581273, "3": 0.0032363795396428753, "2": 7.056615587068328e-06, "1": 8.063556755256831e-08}, "score": 4.41230031400844}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9895079783108159, "4": 0.01047858110499654, "3": 1.3279075928955907e-05, "2": 9.698252784275194e-08, "1": 0}, "score": 4.98949456911769}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9954207747699076, "4": 0.004571851563512299, "3": 7.2594608134893315e-06, "2": 4.14794380985152e-08, "1": 0}, "score": 4.995413504742988}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8593174479740183, "5": 0.13613322188915106, "3": 0.0045449616010602096, "2": 4.263999450373548e-06, "1": 8.27875623502132e-08}, "score": 4.131579486788193}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6370102961753636, "4": 0.3620835473502259, "3": 0.0009050964910528045, "2": 9.934272535807971e-07, "1": 7.724806268456389e-08}, "score": 4.63610297428443}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9196981597497254, "5": 0.07268376023007658, "3": 0.007610160626791188, "2": 7.766227754140776e-06, "1": 6.596661870931339e-08}, "score": 4.065057874920905}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9963609496512925, "4": 0.003635525906207821, "3": 3.5149614501576806e-06, "2": 2.069478708567288e-08, "1": 0}, "score": 4.996357382127378}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6936087349175638, "5": 0.3035983707230288, "3": 0.002787253713501898, "2": 5.615381663250897e-06, "1": 8.499120979331544e-08}, "score": 4.300799613306722}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9158153569583805, "4": 0.08393449548566956, "3": 0.0002497797570963954, "2": 3.24149826685277e-07, "1": 2.7558081637242865e-08}, "score": 4.915564860959691}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8060291023446484, "4": 0.19332673384053153, "3": 0.000642690041817935, "2": 1.4051043323994471e-06, "1": 7.494382530357812e-08}, "score": 4.805383372208783}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9164977249770525, "4": 0.08300418921411615, "3": 0.0004971966182200421, "2": 7.669095266256362e-07, "1": 6.150219326034527e-08}, "score": 4.9159988657065945}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9893896372651992, "4": 0.010586912611249081, "3": 2.3318698698268787e-05, "2": 7.497770756943049e-08, "1": 1.2806538194341496e-08}, "score": 4.989366173368012}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9615753402776662, "4": 0.0383346918634074, "3": 8.971056628657063e-05, "2": 1.235528298848404e-07, "1": 1.6267298033073955e-08}, "score": 4.961485446751936}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.796147108929594, "4": 0.20360354151145565, "3": 0.00024840501969430835, "2": 9.103570060773166e-07, "1": 7.126482280973343e-08}, "score": 4.795896639887524}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.985310180816296, "4": 0.014681824188412513, "3": 7.897920981693638e-06, "2": 4.9618950978927286e-08, "1": 0}, "score": 4.985302230415284}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8866467664320477, "4": 0.11311410398110881, "3": 0.0002379645131075785, "2": 7.443756675832266e-07, "1": 1.6786546196651066e-07}, "score": 4.88640703368382}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995024950966258, "4": 0.0004968096515987508, "3": 5.86890838199879e-07, "1": 9.423163280537094e-09, "2": 6.917329861112566e-09}, "score": 4.999501958076254}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5744668188110701, "5": 0.42394251956665485, "3": 0.001555051523214275, "2": 3.432066181076458e-05, "1": 8.455090203559927e-07}, "score": 4.4223164776709645}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5516917569484411, "4": 0.4324987252557914, "2": 0.008697816168031261, "5": 0.0070982074403622775, "1": 1.344723566238781e-05}, "score": 3.4379704500606225}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8489112269789603, "5": 0.1413616469908121, "3": 0.009714370451022627, "2": 1.2539009664511616e-05, "1": 1.8735080779999454e-07}, "score": 4.131621640313854}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7973695989349538, "4": 0.20207782166612234, "3": 0.00055175651776603, "2": 8.09020969461089e-07, "1": 5.5963675973596143e-08}, "score": 4.796816022935489}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9970756698078672, "4": 0.002922207368997855, "3": 2.0789138253408018e-06, "2": 1.5669651825532924e-08, "1": 0}, "score": 4.997073587711755}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9488944536980094, "4": 0.051058124456086124, "3": 4.712075480346426e-05, "2": 1.7705241823419815e-07, "1": 2.6927978444089734e-08}, "score": 4.948846990197633}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6498324620553161, "5": 0.346297758606047, "3": 0.0038582413813864702, "2": 1.1032798938493356e-05, "1": 3.1721660496191777e-07}, "score": 4.342416564331321}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9155281931353616, "4": 0.08429345975175502, "3": 0.000175816802485897, "2": 1.5240260616893615e-06, "1": 8.981515670320238e-07}, "score": 4.915346732805028}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5255385146048512, "5": 0.47195665039397405, "3": 0.0025020547116756044, "2": 2.5699785638662634e-06, "1": 1.846423733088824e-07}, "score": 4.4694489138481295}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.902807623310375, "4": 0.09704401893138918, "3": 0.00014780082021101146, "2": 4.938791427469873e-07, "1": 3.554021374601819e-08}, "score": 4.902658752951204}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9289451294628522, "4": 0.07097187550960049, "3": 8.257636965707272e-05, "2": 3.291043378947402e-07, "1": 0}, "score": 4.928861978067409}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9303677043088865, "5": 0.03747954730474851, "3": 0.032028194050929444, "2": 0.00012231278288565305, "1": 1.841330775880246e-06}, "score": 4.005201205777356}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.700186591621575, "4": 0.2993231859101852, "3": 0.0004895527689830121, "2": 6.44061898356789e-07, "1": 7.212767676119115e-08}, "score": 4.699695501816698}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9814583747468923, "4": 0.018484609722801672, "3": 5.671260848965262e-05, "2": 2.46224774677302e-07, "1": 8.816674375224229e-08}, "score": 4.98140087430423}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8662996622176045, "4": 0.13328383859439374, "3": 0.00041513719583238464, "2": 1.046918992635409e-06, "1": 2.373113131923314e-07}, "score": 4.865881786582428}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8789132744886451, "5": 0.11004245864301754, "3": 0.011030302730409797, "2": 1.3729757505413188e-05, "1": 2.495024754901127e-07}, "score": 4.09898394639333}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8810394547469339, "5": 0.07392973233049714, "3": 0.04480781557399447, "2": 0.00022163780887006135, "1": 1.2230375482164358e-06}, "score": 4.028674975940313}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7141971602191675, "4": 0.22150763955531516, "2": 0.06245240701992476, "5": 0.0015647248267540122, "1": 0.0002778572681615848}, "score": 3.161629001774184}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5325640909763735, "5": 0.4648935613123616, "3": 0.0025403688295732993, "2": 1.8975860112157285e-06, "1": 7.968455971249164e-08}, "score": 4.462349159001986}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6138846284732866, "4": 0.383708089144772, "3": 0.0024037929339094845, "2": 3.137441183427546e-06, "1": 3.332602902149098e-07}, "score": 4.6114735723391655}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5713059662608613, "5": 0.4275392422847842, "3": 0.0011502378866990162, "2": 4.219795039224534e-06, "1": 2.646072991619404e-07}, "score": 4.426379800476804}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9366531519028668, "5": 0.053346868512762, "3": 0.009992104978090796, "2": 7.660441031158077e-06, "1": 1.1174570926821808e-07}, "score": 4.043339111854253}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8616812209493987, "4": 0.13818820757217698, "3": 0.000130265354427288, "2": 3.159610153865466e-07, "1": 6.710763594265495e-08}, "score": 4.861550056058362}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6444015515104201, "4": 0.35427401910996337, "3": 0.0013234984598401321, "2": 8.074013148742305e-07, "1": 4.3948690872726903e-08}, "score": 4.643076357571315}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.978923517096854, "4": 0.021065123937369725, "3": 1.1299738207412143e-05, "2": 1.779367108315355e-08, "1": 0}, "score": 4.978912222331453}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7860806686099032, "5": 0.20951347958400943, "3": 0.004398319688382828, "2": 7.38859472563043e-06, "1": 2.392085670703018e-07}, "score": 4.2050996454553955}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8911124615534151, "5": 0.0844850485932112, "3": 0.02436132122820997, "2": 4.0227287463115174e-05, "1": 8.202726926164359e-07}, "score": 4.060040819240839}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.782295940101264, "4": 0.21727220730819793, "3": 0.0004315506815468523, "2": 2.386711915082838e-07, "1": 1.768523015919803e-08}, "score": 4.781863894637553}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.899064784733137, "4": 0.1008591792383022, "3": 7.594599973701329e-05, "2": 5.538084838399335e-08, "1": 0}, "score": 4.8989887591198436}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9356431034038526, "4": 0.06414254542826356, "3": 0.00021385999200928456, "2": 4.092805396589284e-07, "1": 4.743440631207321e-08}, "score": 4.935428314783273}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9260334702599733, "4": 0.07373269170881079, "3": 0.0002330797239610491, "2": 6.779949482448986e-07, "1": 9.742568058630764e-08}, "score": 4.925798726425533}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6735845181919051, "5": 0.32228816863597315, "3": 0.004125342220876398, "2": 1.8314272079800735e-06, "1": 0}, "score": 4.318159207951539}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9730785153123254, "4": 0.026908248599284045, "3": 1.306336252235023e-05, "2": 2.604927240102168e-08, "1": 0}, "score": 4.973065542577198}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.956916612116627, "5": 0.03244683744187019, "3": 0.01063488121122229, "2": 1.6740244169696321e-06, "1": 6.639461341611629e-09}, "score": 4.021808588014079}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9937553440178795, "4": 0.006243190057933437, "3": 1.4972971129130227e-06, "2": 2.963772164632278e-09, "1": 1.1664848641390271e-09}, "score": 4.9937538020123435}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7776805447411743, "4": 0.22177722321137183, "3": 0.0005418100929141413, "2": 3.733862239743328e-07, "1": 1.5149868271186844e-08}, "score": 4.777137968396953}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.925598808848598, "5": 0.04455841295092296, "3": 0.029786655135931556, "2": 5.5782910440094404e-05, "1": 3.822660518314829e-07}, "score": 4.014659044578634}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8211082227561296, "5": 0.17476134127047915, "3": 0.004128977010114825, "2": 1.33090818885845e-06, "1": 3.4423099528479306e-08}, "score": 4.1706296151510776}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9530791006890891, "3": 0.03067538615114535, "5": 0.016234093680891244, "2": 1.1338914356568108e-05, "1": 6.464409977550608e-08}, "score": 3.9855358355384576}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9236580200669783, "5": 0.07304293938561777, "3": 0.003297819455419936, "2": 1.1350600510686291e-06, "1": 0}, "score": 4.069742855810208}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7342217604828919, "5": 0.26182278426895106, "3": 0.003951596517827727, "2": 3.721778174458467e-06, "1": 7.50539986854856e-08}, "score": 4.257863534994056}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5942739325587464, "5": 0.40111999782278235, "3": 0.004602719290678526, "2": 2.9520019224199202e-06, "1": 2.0384702537750548e-07}, "score": 4.396510840100153}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8781933879293311, "4": 0.12169963234347472, "3": 0.00010671775632063755, "2": 1.871249989159136e-07, "1": 3.341249183002242e-08}, "score": 4.878086232067619}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5658643747927747, "5": 0.43309930303939076, "3": 0.0010359913340463052, "2": 3.021373867513286e-07, "1": 2.02145741523376e-08}, "score": 4.432062650451529}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.990619025475916, "4": 0.009374673822477446, "3": 6.209240327606632e-06, "2": 2.2506132709689628e-08, "1": 6.8384140242305465e-09}, "score": 4.990612812241712}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9022057235820298, "4": 0.0977021122903269, "3": 9.20421438940144e-05, "2": 6.88646398767346e-08, "1": 9.299194996963283e-09}, "score": 4.90211355534181}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8321411592432569, "5": 0.16525436269895685, "3": 0.0026003646338486476, "2": 3.913188668810237e-06, "1": 1.1831988387416737e-07}, "score": 4.162645830051315}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5515222150265626, "5": 0.4466891232661908, "3": 0.0017856514006237153, "2": 2.837579948133559e-06, "1": 1.1414731339386094e-07}, "score": 4.44489748032554}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9384830723864683, "5": 0.04974546377185265, "3": 0.011760474366944162, "2": 1.073203890787294e-05, "1": 9.236571286989197e-08}, "score": 4.037963254496553}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.947310975576726, "4": 0.05260000837594434, "3": 8.857729476109357e-05, "2": 3.4092852013783984e-07, "1": 2.1553513375916116e-08}, "score": 4.947221724009493}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8110036858952893, "5": 0.18647268719119395, "3": 0.0025202695976163656, "2": 3.3100210800513767e-06, "1": 8.061799091476496e-08}, "score": 4.183945549567796}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8249867857899799, "4": 0.17428423117465053, "3": 0.0007274487559181664, "2": 1.3336273464282795e-06, "1": 9.932982088027436e-08}, "score": 4.824256455305452}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6127075112888399, "4": 0.38443751999595965, "3": 0.0028535227367429473, "2": 1.4027471416407403e-06, "1": 6.234539654650039e-08}, "score": 4.609850984364884}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6169391390842138, "5": 0.3792683033324259, "3": 0.003791122991315197, "2": 1.359568755560616e-06, "1": 4.843713816512998e-08}, "score": 4.3754743258746025}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7402021384631553, "4": 0.25846026773499947, "3": 0.0013354699855280254, "2": 1.8339911677156892e-06, "1": 1.9215951549121877e-07}, "score": 4.7388624961782195}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6580660715551769, "4": 0.3413025335030152, "3": 0.0006306450963565199, "2": 6.701146632667087e-07, "1": 3.6511082219130476e-08}, "score": 4.657434005110351}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8277937001907325, "3": 0.16922804414609374, "5": 0.0024339033341900782, "2": 0.0005425306372232631, "1": 1.8262789899061845e-06}, "score": 3.832115319846806}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8205556387212255, "4": 0.178876706673392, "3": 0.0005655815862765551, "2": 1.7772230431195993e-06, "1": 1.303042156400678e-07}, "score": 4.819986247477257}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5085239323496217, "4": 0.4899884987949371, "3": 0.001482263452038298, "2": 4.887346694494916e-06, "1": 2.422043610506628e-07}, "score": 4.507031256753748}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9296765769873125, "4": 0.0701474025643104, "3": 0.0001752975048040595, "2": 5.819623977378838e-07, "1": 7.457854288479251e-08}, "score": 4.929499953543329}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6187203719270272, "4": 0.3700006413377866, "3": 0.01111771385361102, "2": 0.00015558910001362632, "1": 5.3925725764370075e-06}, "score": 4.607275478999735}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9027061985715374, "5": 0.08499923691523005, "3": 0.012278252143312548, "2": 1.5947667143917118e-05, "1": 2.6814230729375804e-07}, "score": 4.0726882920295235}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5474808473020946, "5": 0.4498835848589115, "3": 0.0026273298885795713, "2": 7.967769231591797e-06, "1": 1.6345420133621341e-07}, "score": 4.447239876801827}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8491324905643224, "4": 0.15046138587088279, "3": 0.00040485899984757845, "2": 1.0539453070878188e-06, "1": 2.3604272740070424e-07}, "score": 4.848724793968474}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.757280706409439, "5": 0.23944021919250166, "3": 0.00327018572189253, "2": 8.550169078055179e-06, "1": 1.635034084561157e-07}, "score": 4.236152483949781}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.881534887943001, "5": 0.11594272034031322, "3": 0.002519815485951565, "2": 2.49082892818995e-06, "1": 3.69321644598928e-08}, "score": 4.113417817897332}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5212013727026378, "5": 0.47474213312048497, "3": 0.004044663180691878, "2": 1.1381082622541814e-05, "1": 3.846877002559153e-07}, "score": 4.470673584411538}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9964546947880021, "4": 0.003523547444941751, "3": 2.146353734505249e-05, "2": 1.651709233711644e-07, "1": 7.856928421160008e-08}, "score": 4.99643271551035}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8660543349079415, "4": 0.1336451935509161, "3": 0.0002998815483832216, "2": 4.5591611622539707e-07, "1": 1.8265478123668103e-08}, "score": 4.865753586994822}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948059841905312, "4": 0.005186538811203904, "3": 7.401017997395821e-06, "2": 5.017213720976964e-08, "1": 0}, "score": 4.994798508502149}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9973132253571052, "4": 0.0026853666645258525, "3": 1.4516423316066676e-06, "2": 8.991986905814869e-09, "1": 4.292412104050985e-09}, "score": 4.997311686058296}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8714434537047772, "5": 0.08452117367267038, "3": 0.04390382205212382, "2": 0.00012914018993485498, "1": 2.1909967076983917e-06}, "score": 4.040352507103239}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9458090246513552, "4": 0.05401300111539676, "3": 0.00017637105767324973, "2": 1.2371811899218302e-06, "1": 2.689538589833792e-07}, "score": 4.945629464134106}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7378556866854896, "5": 0.2568470775950122, "3": 0.005290932884408891, "2": 5.7330894586479775e-06, "1": 3.0964418159564414e-07}, "score": 4.251543815026053}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6878718107452664, "5": 0.31006113229279364, "3": 0.002062907259698895, "2": 3.943515395881392e-06, "1": 2.430443256884628e-07}, "score": 4.307989597517604}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9964118538368829, "4": 0.0035841081806207674, "3": 4.00140703478788e-06, "2": 2.614334950011281e-08, "1": 0}, "score": 4.996407810537787}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9090007951977821, "5": 0.08833687925149122, "3": 0.00266021588422154, "2": 2.0586029187962134e-06, "1": 3.01801926578654e-08}, "score": 4.085672457409986}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.678103464619987, "5": 0.32031583037534206, "3": 0.0015791755056689253, "2": 1.5518139825360408e-06, "1": 1.8908524212950176e-08}, "score": 4.318733481376825}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6671585334325965, "4": 0.33224248505141213, "3": 0.0005983933166896393, "2": 5.590695236823686e-07, "1": 2.6087906043177814e-08}, "score": 4.666558945740729}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7510356562371425, "4": 0.2487816686228911, "3": 0.00018224456667550318, "2": 4.391815306014305e-07, "1": 1.6181147612310828e-08}, "score": 4.75085246615079}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8789047227040888, "3": 0.07775573255731937, "5": 0.04265345927042599, "2": 0.0006807240138248791, "1": 5.341612416044166e-06}, "score": 3.96352025312438}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7927131186110572, "5": 0.19930925805146799, "3": 0.007972504457267033, "2": 4.940216014939134e-06, "1": 1.1510719641721997e-07}, "score": 4.191326540000722}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7956440392718654, "4": 0.2039777009869648, "3": 0.00037751120786776177, "2": 6.708300572072086e-07, "1": 7.279023684566989e-08}, "score": 4.795264971940316}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8368514611601964, "4": 0.16294057747661886, "3": 0.00020772447412680366, "2": 9.778829011985677e-08, "1": 1.9605082364740506e-08}, "score": 4.8366435822695415}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9321038252670447, "4": 0.06772335369372862, "3": 0.00017178781094996691, "2": 8.044862194465193e-07, "1": 1.1563201184138637e-07}, "score": 4.931930186998287}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8001548320325338, "4": 0.1993510177152018, "3": 0.0004929368428191524, "2": 1.1152521891687953e-06, "1": 8.66723430511304e-08}, "score": 4.799659413852326}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7363099287834198, "5": 0.2525568012802715, "3": 0.011016457366888817, "2": 0.00011180715512074979, "1": 4.964390635616657e-06}, "score": 4.2413018463303205}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9249613464171274, "4": 0.074649593531628, "3": 0.0003879974851244586, "2": 9.97868832134177e-07, "1": 6.55988940586843e-08}, "score": 4.924571155564058}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8769725473566123, "4": 0.12253646742915365, "3": 0.0004900988267259078, "2": 8.490141365068606e-07, "1": 5.47987200509338e-08}, "score": 4.876480570832473}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9922840509517387, "4": 0.0077050817521022025, "3": 1.066676206797497e-05, "2": 1.0542099785977242e-07, "1": 0}, "score": 4.992273267725856}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7886397918188383, "5": 0.1929330194103957, "3": 0.01839971322659121, "2": 2.713649654869836e-05, "1": 2.077257784291608e-07}, "score": 4.174478432926202}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7686009767770017, "4": 0.23114059898502545, "3": 0.00025825321522335336, "2": 9.72863641420787e-08, "1": 6.523896609691443e-09}, "score": 4.768342561059575}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9182418223611913, "5": 0.0758573254299935, "3": 0.005898088285398984, "2": 2.7134138299506863e-06, "1": 4.3130734349995296e-08}, "score": 4.06995368144091}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6956673836023517, "4": 0.30412100926096725, "3": 0.0002114730480470065, "2": 1.0795147676454596e-07, "1": 0}, "score": 4.695455712828587}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8145692443538824, "4": 0.18535036131893526, "3": 8.022535066170251e-05, "2": 8.616842721320896e-08, "1": 7.723555669444988e-09}, "score": 4.814488884651221}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7009082604887057, "5": 0.2984305310605151, "3": 0.0006609264467650677, "2": 3.42439101805757e-07, "1": 1.091712696160851e-08}, "score": 4.297768865737697}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8289449759951931, "5": 0.1602948254979893, "3": 0.010743038667325124, "2": 1.6871141486542786e-05, "1": 3.37402586799891e-07}, "score": 4.149517025057767}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6591982863372555, "5": 0.3327084493424179, "3": 0.008072037905642655, "2": 2.089388553355747e-05, "1": 3.8921342242961707e-07}, "score": 4.324593437626098}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8164506902547327, "4": 0.1829303499415704, "3": 0.0006181354189477066, "2": 7.870122682679518e-07, "1": 3.858624388611613e-08}, "score": 4.81583086406229}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8691897527138053, "5": 0.09917936504385212, "3": 0.03159158472581954, "2": 3.895926285221381e-05, "1": 3.4833331982343765e-07}, "score": 4.067508816111903}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9215971274146111, "3": 0.053670198192587705, "5": 0.024677403305655925, "2": 5.4805335807518234e-05, "1": 3.0898719532035194e-07}, "score": 3.9708966629175078}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8733457442699094, "3": 0.08536840598282035, "5": 0.041228034706057966, "2": 5.739909622337958e-05, "1": 4.988162726879281e-07}, "score": 3.955743337749579}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.954319803418161, "4": 0.045624669999194775, "3": 5.536172984183879e-05, "2": 7.463278119870808e-08, "1": 1.694942376267835e-08}, "score": 4.954264311494002}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8566654328627957, "5": 0.1374734735669452, "3": 0.005859486542300336, "2": 1.5159549311179833e-06, "1": 2.8983358978210426e-08}, "score": 4.1316108763363815}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9930623002291636, "4": 0.006929802260678838, "3": 7.818084361315219e-06, "2": 1.4633623157175422e-08, "1": 0}, "score": 4.993054517219716}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9116565315370179, "4": 0.08778757527755002, "3": 0.0005554381478991038, "2": 4.269307563424862e-07, "1": 0}, "score": 4.9111002651356985}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9448838680429011, "3": 0.03305024168510449, "5": 0.022055087016525195, "2": 1.0473817357100942e-05, "1": 1.7814820869197298e-07}, "score": 3.9889833615853743}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9525180843188439, "4": 0.047408070550311675, "3": 7.362705534363785e-05, "2": 1.066563343480012e-07, "1": 5.3274076164196327e-08}, "score": 4.952444139508555}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7860154816430703, "5": 0.20909250861389195, "3": 0.00489041799303612, "2": 1.566668762737049e-06, "1": 6.346457250794433e-08}, "score": 4.204198759051785}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9600955329325365, "4": 0.03988752741779042, "3": 1.6766193342411964e-05, "2": 2.153263813714143e-08, "1": 0}, "score": 4.960078869532645}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8250311630227025, "4": 0.1746443427815471, "3": 0.0003239935337282368, "2": 3.168989131139416e-07, "1": 9.294452752340791e-08}, "score": 4.824706331756223}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "human", "scores": {"4": 0.745636174116877, "5": 0.24917919069243788, "3": 0.005177539166354095, "2": 6.805843340516132e-06, "1": 1.756369072268883e-07}, "score": 4.24398754087601}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9889431354793032, "4": 0.011049525423944396, "3": 7.1375926666366075e-06, "2": 5.118542568564489e-08, "1": 0}, "score": 4.988936044171325}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9751399673803199, "4": 0.024837670661636925, "3": 2.2234487133440818e-05, "2": 5.0762091055596596e-08, "1": 1.2964512757952572e-08}, "score": 4.975117654633664}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9053320196699626, "4": 0.09461121104089666, "3": 5.6423433396331815e-05, "2": 2.036937900381304e-07, "1": 5.0444959799692795e-08}, "score": 4.905275120543221}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.591233373796579, "4": 0.40827035059866573, "3": 0.0004954973263854548, "2": 7.860023929941661e-07, "1": 4.03555865306958e-08}, "score": 4.590736154996284}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6018072907224932, "4": 0.3926550648883325, "3": 0.005532978504702843, "2": 4.506120383697797e-06, "1": 1.5859358123035406e-07}, "score": 4.596264824894212}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9809665724223906, "4": 0.018896202557270318, "3": 0.00013568561535791558, "2": 1.3147973640342062e-06, "1": 2.614405294883728e-07}, "score": 4.980827436763985}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8564048919990964, "4": 0.14275755602113901, "3": 0.0008366383162841531, "2": 7.327725377987762e-07, "1": 1.6791415000990628e-07}, "score": 4.855566295497793}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9964053363282624, "4": 0.0035868603982261915, "3": 7.773251598329762e-06, "2": 5.6486509342718544e-08, "1": 2.1874593231654278e-08}, "score": 4.996397336314826}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8551348099655905, "4": 0.14420110372995584, "3": 0.0006610493905175807, "2": 2.798651119204148e-06, "1": 1.8743288542749903e-07}, "score": 4.85446764440671}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5470465607399221, "3": 0.44376108864896907, "5": 0.005783414654843579, "2": 0.003396193613289136, "1": 1.2643048746881119e-05}, "score": 3.555191965466185}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6154339501508079, "4": 0.3832316125775858, "3": 0.0013287305051324218, "2": 5.425247703222139e-06, "1": 1.60739949232182e-07}, "score": 4.614093961099967}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6534783668403967, "5": 0.34297908855042863, "3": 0.0035361433318599348, "2": 5.927749072895966e-06, "1": 2.4423059413719106e-07}, "score": 4.33943043485924}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998675636144865, "4": 0.0013213213768832463, "3": 2.969900818950586e-06, "2": 2.297782997526817e-08, "1": 1.153303858605274e-08}, "score": 4.998672623705306}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6775980116834898, "4": 0.3215296871709507, "3": 0.000869658458352792, "2": 2.547518015600384e-06, "1": 1.0390113655181994e-07}, "score": 4.676722940576588}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6672749961185923, "4": 0.3313865036750057, "3": 0.0013373083221581645, "2": 1.102308434806674e-06, "1": 6.120420136680648e-08}, "score": 4.665935318460617}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9434245420513246, "4": 0.05652061161560079, "3": 5.477898077988715e-05, "2": 2.630070742067281e-08, "1": 0}, "score": 4.943369749195956}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9795866578449411, "4": 0.020313306806020035, "3": 9.977289547106146e-05, "2": 1.9231580470026823e-07, "1": 4.01942052388143e-08}, "score": 4.9794864090645525}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9995461927016951, "4": 0.0004505619394102503, "3": 3.1413560129721996e-06, "2": 4.442337686923793e-08, "1": 4.2894209363278605e-08}, "score": 4.999542850493967}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9992230709058229, "4": 0.0007745103769036586, "3": 2.302320570442695e-06, "2": 1.8862990673811115e-08, "1": 1.1350171307058424e-08}, "score": 4.999220782925143}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6187325299017873, "5": 0.37577158758875806, "3": 0.005487258009773252, "2": 7.92115919375566e-06, "1": 5.567347067379216e-07}, "score": 4.370266871339741}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9864377523534342, "4": 0.013536019980751648, "3": 2.6045240833163097e-05, "2": 6.167044698226522e-08, "1": 3.073357904891283e-08}, "score": 4.986411580368683}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8882124936193251, "5": 0.10235900380565222, "3": 0.009426513264203733, "2": 1.92761320830787e-06, "1": 3.024142995141256e-08}, "score": 4.092928547513919}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9765728727282477, "4": 0.02340387434557539, "3": 2.3137682325714378e-05, "2": 4.538428214967164e-08, "1": 1.2455008571935862e-08}, "score": 4.976549662970737}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9892695761815931, "4": 0.010723425837487607, "3": 6.868443789670252e-06, "1": 1.3735460369192806e-08, "2": 1.2618851377771484e-08}, "score": 4.989262743368638}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.614309368645408, "3": 0.3738467780011974, "5": 0.007275643618070039, "2": 0.004550697777887077, "1": 1.743543375047753e-05}, "score": 3.624275135007995}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7790786230711476, "4": 0.22052303994663267, "3": 0.0003968125718364042, "2": 1.185414565801845e-06, "1": 9.509218951002315e-08}, "score": 4.778679344316327}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6077299237879861, "4": 0.3880349756475566, "3": 0.004229294858238471, "2": 5.789492044619259e-06, "1": 6.973078068147193e-08}, "score": 4.603488808456643}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.858940144386664, "4": 0.14051771679120478, "3": 0.000539571635932616, "2": 2.466890764687339e-06, "1": 1.1545811655259302e-07}, "score": 4.858395279579276}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.974219800435982, "4": 0.02573092250621177, "3": 4.9015744261692956e-05, "2": 1.5534770100903887e-07, "1": 2.7226719806586065e-08}, "score": 4.974170469021488}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5668897945607114, "4": 0.4290615916841645, "3": 0.004037250855312086, "2": 1.0794605924896138e-05, "1": 5.468528956687432e-07}, "score": 4.562829326002482}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9825813094038457, "4": 0.017378115400123868, "3": 4.0467353311174856e-05, "2": 1.0616864675740954e-07, "1": 5.019692836846329e-08}, "score": 4.982540431446787}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6393889527701149, "5": 0.3566897224144545, "3": 0.003916942907393084, "2": 4.139705118828292e-06, "1": 2.3931049162826294e-07}, "score": 4.352763783185693}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7171985492859986, "4": 0.28184263379277613, "3": 0.0009577172209767566, "2": 1.0443049640510243e-06, "1": 8.53781178712902e-08}, "score": 4.716238465845882}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5768354125760055, "5": 0.42202340685638884, "3": 0.001139126543683992, "2": 2.0076935145108196e-06, "1": 8.641582657154714e-08}, "score": 4.420879988807045}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "human", "scores": {"4": 0.894685570778211, "5": 0.05470373994246247, "3": 0.05057396807460296, "2": 3.6421583709504935e-05, "1": 3.4121996806168954e-07}, "score": 4.004055904871814}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.79067115571521, "5": 0.10399873951107816, "3": 0.10035053223169932, "2": 0.004864234130958892, "1": 0.00011508299433780408}, "score": 3.9935744883932642}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8946478650493901, "5": 0.07890313642651917, "3": 0.026441339590058552, "2": 7.616778855601593e-06, "1": 5.807503242269727e-08}, "score": 4.052446388218714}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7770331619911073, "4": 0.22216602861191082, "3": 0.0007976194132752082, "2": 3.0365122116396196e-06, "1": 1.5020557216533612e-07}, "score": 4.776229021471796}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6758065111629427, "5": 0.3096098569746373, "3": 0.014526481280472882, "2": 5.6035507817263014e-05, "1": 1.1855876489632141e-06}, "score": 4.29496772711637}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5496794988346095, "4": 0.4487517228351744, "3": 0.0015632087174838492, "2": 5.103209002147993e-06, "1": 4.3722277025050844e-07}, "score": 4.548104788025036}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6984358389361104, "4": 0.3004519614047532, "3": 0.0011110002981087198, "2": 1.094452849937554e-06, "1": 9.59105356786564e-08}, "score": 4.6973223682749525}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9751332779430886, "4": 0.02468161609795179, "3": 0.00018440686844553743, "2": 5.025403006150956e-07, "1": 8.167727708657834e-08}, "score": 4.974947732957319}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9947784892273818, "4": 0.005217231926586899, "3": 4.290698576225755e-06, "2": 1.613535515853326e-08, "1": 0}, "score": 4.994774138416456}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9791767307870979, "4": 0.020784380746703572, "3": 3.8835180819779556e-05, "2": 7.747589354544742e-08, "1": 2.0195015912273534e-08}, "score": 4.9791376366099005}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7657764443075316, "5": 0.2328369629895683, "3": 0.0013859025374321047, "2": 5.870052930723152e-07, "1": 1.2331609413793947e-08}, "score": 4.231449870468983}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6911065294640221, "3": 0.3031234289952203, "5": 0.005152710974460413, "2": 0.0006164455872507594, "1": 8.19601164309561e-07}, "score": 3.700793912439785}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.909487950136116, "5": 0.07540348385968774, "3": 0.015101448690424069, "2": 7.118930887962504e-06, "1": 8.438636504456901e-08}, "score": 4.060287538963454}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.534594886723708, "4": 0.46483275721121686, "3": 0.0005718415588340823, "2": 4.7474738283105814e-07, "1": 2.126500655474194e-08}, "score": 4.534022041751213}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.807539313194352, "5": 0.17945788904457546, "3": 0.012978449861396539, "2": 2.3725574471489964e-05, "1": 6.065388830893946e-07}, "score": 4.166430171044907}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9018669367811226, "5": 0.09647310636468653, "3": 0.0016593638051206948, "2": 6.513485050250445e-07, "1": 0}, "score": 4.0948124343350445}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5267461949286298, "5": 0.4721272180246254, "3": 0.0011261596209847947, "2": 4.502197680288839e-07, "1": 1.7140221514965394e-08}, "score": 4.471000087734414}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9767661810203927, "4": 0.023221244688340775, "3": 1.247615918502825e-05, "2": 2.7980443982022386e-08, "1": 0}, "score": 4.976753717421193}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.925260573554526, "5": 0.07336657709466618, "3": 0.0013724269637802008, "2": 3.282832612104176e-07, "1": 1.3902251938054224e-08}, "score": 4.071993457631592}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9291127272100985, "4": 0.07086456208139612, "3": 2.2587723663569728e-05, "2": 2.096121524349325e-08, "1": 0}, "score": 4.929090192353155}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9809753991993209, "4": 0.018975217373160998, "3": 4.908308910021639e-05, "2": 2.4952418314975e-07, "1": 9.707819977371564e-08}, "score": 4.980925480445753}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6499738809848808, "3": 0.2870910115723108, "5": 0.055030758753943955, "2": 0.00783383426360058, "1": 7.037883353653188e-05}, "score": 3.752060908535333}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9523455979604531, "4": 0.04753420603766102, "3": 0.00011996278359414788, "2": 1.3838723924509695e-07, "1": 2.1418345838546916e-08}, "score": 4.952225364052783}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9807725220961415, "4": 0.0191770639494713, "3": 5.013836873337568e-05, "2": 2.929247754414938e-07, "1": 5.523190839700018e-08}, "score": 4.980721561010157}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9878615713699781, "4": 0.0121203841899816, "3": 1.78812657381532e-05, "2": 9.180564948340377e-08, "1": 2.8345884070814394e-08}, "score": 4.987843463955049}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7725801125661809, "3": 0.22383068130164108, "5": 0.0033726651549720456, "2": 0.0002152444928252493, "1": 1.1202989372634607e-06}, "score": 3.7791080950529303}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7069008947982824, "5": 0.28096701524728174, "3": 0.012124428224654859, "2": 7.482070496022815e-06, "1": 1.9167070796589583e-07}, "score": 4.268827044640517}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8742024447499837, "5": 0.10570241908908007, "3": 0.020061155418027516, "2": 3.326492564517123e-05, "1": 5.034250469101218e-07}, "score": 4.085573241719712}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6243558192319595, "4": 0.3748148531002796, "3": 0.000826929015798443, "2": 2.0879454787386584e-06, "1": 1.5011922878744122e-07}, "score": 4.623524364097584}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9131883515932485, "5": 0.06041769218276269, "3": 0.026363692486604872, "2": 2.9934466969771325e-05, "1": 2.375568199953154e-07}, "score": 4.033993421209416}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.765787226515774, "4": 0.23376760456551712, "3": 0.000444607583355308, "2": 5.553790407512212e-07, "1": 1.668311010937914e-08}, "score": 4.765341449915345}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9915302352840923, "4": 0.008459332577707852, "3": 1.0376924656416463e-05, "2": 1.6855665587770163e-08, "1": 0}, "score": 4.991519862680701}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9919807302868467, "4": 0.00801413837707489, "3": 5.122084873200693e-06, "2": 4.067830606962967e-09, "1": 2.421736480913941e-09}, "score": 4.9919755955405805}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.968873594532014, "4": 0.031114224031476137, "3": 1.2084208987818292e-05, "2": 2.0678320589687514e-08, "1": 5.126493191081552e-09}, "score": 4.96886152278562}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9424733574660947, "4": 0.05742318140241781, "3": 0.00010309764593852956, "2": 2.252882823409235e-07, "1": 4.7658015730352945e-08}, "score": 4.942369751590994}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6442052902469039, "5": 0.348296447918939, "3": 0.007496360071856721, "2": 1.4746291846737654e-06, "1": 8.719332998105628e-08}, "score": 4.340796992859179}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9257751198157266, "4": 0.07409270496811106, "3": 0.0001320029879036992, "2": 5.1410932116939226e-08, "1": 8.03258052572242e-09}, "score": 4.925643094306639}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8388274711115637, "4": 0.16061295732427286, "3": 0.0005589812094241549, "2": 3.5280018092074604e-07, "1": 0}, "score": 4.8382679834361575}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9155838589417276, "4": 0.08421454745774741, "3": 0.0002011678346627941, "2": 3.175651000829748e-07, "1": 2.749254389850456e-08}, "score": 4.915382047378087}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8078826792107767, "4": 0.19114778627403034, "3": 0.0009666843864649653, "2": 2.3862176949429515e-06, "1": 2.4058364779315164e-07}, "score": 4.806910680843231}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8989598646008935, "3": 0.06646501234006415, "5": 0.034321688735262965, "2": 0.0002509507131666166, "1": 2.3891402136181174e-06}, "score": 3.9673476044635394}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9152894636683556, "3": 0.06189424352383154, "5": 0.022710241246538018, "2": 0.00010525011423859963, "1": 7.757255903381469e-07}, "score": 3.9606031693041155}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.823309652983786, "5": 0.12226905422393759, "3": 0.05432677932715249, "2": 9.292572870035277e-05, "1": 1.4211971189456263e-06}, "score": 4.067752171131426}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9272361586831896, "4": 0.07264600355829387, "3": 0.00011745726413826067, "2": 2.931759195739369e-07, "1": 5.3699507864931676e-08}, "score": 4.927117985137423}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "gpt35", "target_model": "llama", "scores": {"3": 0.5570576185335051, "4": 0.42020134068017256, "2": 0.021576942743885802, "5": 0.0011089196787196682, "1": 5.5014047293820755e-05}, "score": 3.4007322750460327}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8249957864449113, "3": 0.16306628571683587, "5": 0.011426686936684811, "2": 0.0005076423468364707, "1": 3.31854541186081e-06}, "score": 3.847335118142351}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8618527039566914, "3": 0.1207448786723793, "5": 0.016356699667067185, "2": 0.0010432003826373654, "1": 2.49848752292729e-06}, "score": 3.893517922761393}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6828970519373707, "4": 0.3135057743812009, "3": 0.003586359707463628, "2": 1.0232465502001494e-05, "1": 4.951772785545317e-07}, "score": 4.679288800410874}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8697035174099802, "4": 0.12965113664620362, "3": 0.0006430674116196828, "2": 2.033544964433952e-06, "1": 1.8198164620177697e-07}, "score": 4.869055891718869}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9528220965848486, "4": 0.04706959630912799, "3": 0.00010793709006034653, "2": 2.7240034395181236e-07, "1": 2.6817477941461237e-08}, "score": 4.952713601692019}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8990378887133497, "3": 0.0812345930299508, "5": 0.019649924164250272, "2": 7.703166398917408e-05, "1": 4.045789258301435e-07}, "score": 3.93826004432392}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8067864966224024, "4": 0.19314851079410192, "3": 6.498013176159488e-05, "2": 4.602067890765728e-08, "1": 0}, "score": 4.806721397368498}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7752107586146622, "5": 0.22141427161782282, "3": 0.0033735985005428327, "2": 1.2285530047577275e-06, "1": 2.8829346295697826e-08}, "score": 4.218038154354423}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.845498597015245, "4": 0.1543584011956713, "3": 0.0001426994339789302, "2": 2.2142785756358925e-07, "1": 2.2260055451933095e-08}, "score": 4.845355437540014}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6549699121832818, "4": 0.3446712206333034, "3": 0.0003580374385772307, "2": 7.399708821265521e-07, "1": 4.136916667068487e-08}, "score": 4.654610302381713}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5572505052678085, "3": 0.4392904795937406, "5": 0.0021607346486421297, "2": 0.0012942854657603119, "1": 3.7262581677780262e-06}, "score": 3.560270387164561}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.951404607626093, "4": 0.04857406172069467, "3": 2.1207408071296574e-05, "2": 4.1651144071805597e-08, "1": 1.251642569066449e-08}, "score": 4.9513833450857065}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8573371504408037, "5": 0.13420363075557318, "3": 0.00845572121377824, "2": 3.3875994982929756e-06, "1": 6.926479974385441e-08}, "score": 4.1257409316692675}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8542557986573497, "5": 0.1412792995533665, "3": 0.004457689930218025, "2": 6.928660870604914e-06, "1": 2.0542814983220597e-07}, "score": 4.136807146656457}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6376341070965215, "4": 0.36154744542730805, "3": 0.000816474399495987, "2": 1.8560453307556612e-06, "1": 1.3324490646958938e-07}, "score": 4.636813510546628}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5454421657242968, "4": 0.4534553367246118, "3": 0.001102143895606953, "2": 3.815400543461952e-07, "1": 2.056218762552583e-08}, "score": 4.5443391706905505}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.910981927508169, "4": 0.08896275321937253, "3": 5.499331090704548e-05, "2": 1.9902547606275067e-07, "1": 4.229770532506641e-08}, "score": 4.910926486352526}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9978387518672682, "4": 0.002159367336409515, "3": 1.8607200899985588e-06, "2": 9.350229018393118e-09, "1": 0}, "score": 4.997836883149522}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9936841304841475, "4": 0.006310912507300881, "3": 4.861230319154754e-06, "2": 1.9153507094375434e-08, "1": 0}, "score": 4.993679307087219}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9735326012792563, "4": 0.026411242690332192, "3": 5.599915257124296e-05, "2": 7.22538661976063e-08, "1": 0}, "score": 4.973476539998405}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5540819937651793, "5": 0.44297271599932553, "3": 0.0029431583662985336, "2": 2.09251681243201e-06, "1": 3.4104107682987385e-08}, "score": 4.440025272596453}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5903242362884897, "5": 0.4067168239282128, "3": 0.0029552950068313876, "2": 3.542534948286621e-06, "1": 1.0948973898283845e-07}, "score": 4.403754112455768}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8621119623810842, "4": 0.1377986661579309, "3": 8.926991722648442e-05, "2": 6.161681702580449e-08, "1": 0}, "score": 4.86202260364815}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5134633628835964, "4": 0.486026077069256, "3": 0.0005085843378920819, "2": 1.907502048251328e-06, "1": 6.002390124277304e-08}, "score": 4.5129507876675365}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9185712180401955, "5": 0.07170966806146391, "3": 0.009692140302677505, "2": 2.610671492253834e-05, "1": 5.820805480964798e-07}, "score": 4.061963585734539}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7785232679284543, "4": 0.21984023521752769, "3": 0.0016303383647014286, "2": 5.729295409395214e-06, "1": 2.728286212158678e-07}, "score": 4.776880773964254}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7095343990839252, "4": 0.2836369226776579, "3": 0.0067936766760956805, "2": 3.311778860000187e-05, "1": 1.8251068950773612e-06}, "score": 4.702669052733308}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5376415525878452, "4": 0.4565307138725444, "3": 0.005813774286560946, "2": 1.342027412536601e-05, "1": 4.7114049336956244e-07}, "score": 4.531799560408001}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9816164052109497, "4": 0.018319097207811424, "3": 6.396029869380288e-05, "2": 4.5878231437679817e-07, "1": 1.290687020914244e-07}, "score": 4.981551090505983}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.549360337675059, "4": 0.4482277702634629, "3": 0.0024081776002466996, "2": 3.5041204867264595e-06, "1": 1.1015261760244316e-07}, "score": 4.546944876173368}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5779915903402202, "4": 0.42060090248808213, "3": 0.0014058637449473374, "2": 1.5433456469203008e-06, "1": 4.5958684825888345e-08}, "score": 4.576582533233966}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.762438080270954, "4": 0.2371954248969748, "3": 0.0003658679800062418, "2": 5.431670074152692e-07, "1": 3.224831639092217e-08}, "score": 4.762071068410436}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9552844781310107, "4": 0.04461299922406756, "3": 0.00010224240955272866, "2": 2.4431437959936565e-07, "1": 1.2981754049708553e-08}, "score": 4.955181730058575}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9602594073811478, "4": 0.039627379425281134, "3": 0.00011234747881934397, "2": 6.955388277766985e-07, "1": 6.690875576335805e-08}, "score": 4.96014556724992}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7725242802189719, "4": 0.22679165553026234, "3": 0.000680194344426592, "2": 3.712355415179658e-06, "1": 1.6513607598286179e-07}, "score": 4.771836159900992}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9281021841752812, "3": 0.05073245170842337, "5": 0.021061081927929347, "2": 0.00010375886050938039, "1": 4.5324274230702286e-07}, "score": 3.970119750676099}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7340361653407667, "5": 0.26043395020884036, "3": 0.00552553059994699, "2": 4.339983550788681e-06, "1": 6.483106177884365e-08}, "score": 4.254899532157865}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8463050205255244, "5": 0.14648401047455473, "3": 0.007194459953803542, "2": 1.60628725789692e-05, "1": 1.962583369327903e-07}, "score": 4.139256870802991}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8766352321363482, "5": 0.12192291234316369, "3": 0.0014404841595419703, "2": 1.3097490552227647e-06, "1": 1.2597921461121396e-08}, "score": 4.120479776796938}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8831253934705544, "3": 0.10320681410140968, "5": 0.013536886313752777, "2": 0.00013075189000742588, "1": 1.5579886321096847e-07}, "score": 3.9100681011773446}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5281333343380992, "5": 0.4680251524300597, "3": 0.0038334963772112866, "2": 7.689713740823399e-06, "1": 2.923108634814467e-07}, "score": 4.464175415860017}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9629454005880786, "4": 0.03701495717689286, "3": 3.937068713094594e-05, "2": 1.4601536223291523e-07, "1": 2.9949835646380315e-08}, "score": 4.962905740057846}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6537165900467026, "5": 0.33951389669276727, "3": 0.006762565155713375, "2": 6.565302326586512e-06, "1": 2.0806652014156121e-07}, "score": 4.332737634874074}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.979195933610258, "4": 0.020782645323366152, "3": 2.1305016426425494e-05, "2": 7.054507286464832e-08, "1": 1.3955139131459217e-08}, "score": 4.979174476530966}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5333438717960495, "4": 0.46458251215598695, "3": 0.0020665742383052656, "2": 6.356230786035811e-06, "1": 4.6342883593811437e-07}, "score": 4.531263312829828}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7645631301335596, "5": 0.2340537006490551, "3": 0.0013825612800730577, "2": 5.885023011843173e-07, "1": 1.2381480361263136e-08}, "score": 4.232669926861084}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7538966193424219, "4": 0.24557833478900432, "3": 0.0005239768782991954, "2": 9.280084486991353e-07, "1": 5.0249411576308417e-08}, "score": 4.753370704054133}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.909487950136116, "5": 0.07540348385968774, "3": 0.015101448690424069, "2": 7.118930887962504e-06, "1": 8.438636504456901e-08}, "score": 4.060287538963454}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5370977130710544, "4": 0.4623400128663242, "3": 0.0005618322163863306, "2": 4.654342482208844e-07, "1": 2.0986845505421444e-08}, "score": 4.53653486310967}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8875525083896545, "5": 0.10528008542476675, "3": 0.007158825842033364, "2": 8.40561183149424e-06, "1": 1.492046475295541e-07}, "score": 4.098104003249436}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6042938758219498, "4": 0.3945241988578097, "3": 0.0011797006017845622, "2": 1.9094964297746025e-06, "1": 1.437058981239278e-07}, "score": 4.603110028552709}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6898630357550996, "4": 0.3074361670850357, "3": 0.002696469376527618, "2": 4.089544349933054e-06, "1": 1.3796524932304196e-07}, "score": 4.68715804229803}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8201768182146372, "4": 0.17890398745126615, "3": 0.0009179661882442853, "2": 1.1069578287944924e-06, "1": 1.2693800744710154e-07}, "score": 4.819256252586003}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5284011658281542, "5": 0.4703248278069672, "3": 0.001272979580488714, "2": 1.0592621257699524e-06, "1": 3.2569485973186135e-08}, "score": 4.469049601483396}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.756632887682931, "5": 0.2405967700729192, "3": 0.0027648734875760487, "2": 5.182209749966681e-06, "1": 2.0651578227167809e-07}, "score": 4.2378209316515525}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9923299553713888, "4": 0.007634193330895574, "3": 3.56820070654564e-05, "2": 9.388971388718128e-08, "1": 3.573186390088802e-08}, "score": 4.9922940177526876}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7318108207653469, "4": 0.2673422783985002, "3": 0.0008442330296468543, "2": 2.5787107325405205e-06, "1": 1.1638502047589286e-07}, "score": 4.730961061211797}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8967514819431435, "4": 0.10214822850130634, "3": 0.0010967155822415656, "2": 2.7895842153300874e-06, "1": 0}, "score": 4.895649889730476}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9816872863640959, "4": 0.01829464289443342, "3": 1.7930650339119836e-05, "2": 1.6886605672929573e-07, "1": 2.389252950219557e-08}, "score": 4.981668894602053}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987299791599461, "4": 0.0012697922177090665, "3": 2.4665160551584794e-07, "1": 0, "2": 0}, "score": 4.998729714501982}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9295484206084312, "3": 0.03811213285139358, "5": 0.03231272705147733, "2": 2.6472740891363586e-05, "1": 1.647512625769731e-07}, "score": 3.9941471539846}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.836467693785334, "4": 0.1631438095445153, "3": 0.00038787051432748166, "2": 5.564530702363563e-07, "1": 4.582028224845238e-08}, "score": 4.836078592871642}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8669850549575933, "4": 0.13189008403299426, "3": 0.0011244732221110721, "2": 2.6150223673450093e-07, "1": 0}, "score": 4.865860168076216}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9966068139118682, "4": 0.0033916345691759344, "3": 1.5091167681890475e-06, "2": 3.8944709298801985e-09, "1": 0}, "score": 4.996605335383153}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8087380331498688, "4": 0.19101139366849998, "3": 0.0002502302660053021, "2": 3.0484816620856556e-07, "1": 4.854211816910629e-08}, "score": 4.808487039092553}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7692167574103023, "4": 0.23002170613774525, "3": 0.0007608920979285018, "2": 5.913191194740399e-07, "1": 5.1841025659486266e-08}, "score": 4.7684545280684985}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9650148279595611, "4": 0.03495756785429565, "3": 2.749425456578875e-05, "2": 3.277591139681935e-08, "1": 8.604633497474643e-09}, "score": 4.964987308490149}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8215108368926822, "4": 0.17767975114084936, "3": 0.000807865478749331, "2": 1.3609902475103613e-06, "1": 1.0657445372940437e-07}, "score": 4.820699994482197}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9052124332090239, "4": 0.09458193340202782, "3": 0.00020470676857820417, "2": 8.362309550445682e-07, "1": 4.370676243589944e-08}, "score": 4.905005965106328}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9308689353238228, "4": 0.06904709299590217, "3": 8.357375688612202e-05, "2": 2.3339419240198467e-07, "1": 4.278454062318956e-08}, "score": 4.930784879743015}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8605353529321353, "3": 0.1345393981211408, "5": 0.004813407623786497, "2": 0.00011158833930393944, "1": 1.9682949314795454e-07}, "score": 3.8700502350383412}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9057274101584009, "4": 0.09409792346088679, "3": 0.00017419067942504854, "2": 3.5451010019424547e-07, "1": 5.953205083079474e-08}, "score": 4.905552387698203}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6591281645533987, "4": 0.33999237095204915, "3": 0.0008792365358050941, "2": 2.4997698083087036e-07, "1": 0}, "score": 4.658248413570163}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7849896154604746, "5": 0.2120595176667884, "3": 0.002946617431226718, "2": 4.0884484988978685e-06, "1": 9.249622537661014e-08}, "score": 4.209104460172871}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7797667441368984, "4": 0.22010781158660117, "3": 0.00012523920616953603, "2": 1.6645780218128328e-07, "1": 1.2348824013317671e-08}, "score": 4.779641155444917}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5117228546550241, "5": 0.48776248630566227, "3": 0.0005139131374900961, "2": 6.689155620204914e-07, "1": 2.192154267135782e-08}, "score": 4.48724719640255}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9349892192255287, "4": 0.06488359893988688, "3": 0.00012701288753506958, "2": 1.103936746038316e-07, "1": 0}, "score": 4.934862040289972}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8485439486083499, "5": 0.134096377832853, "3": 0.017329441554160545, "2": 2.928661418748906e-05, "1": 7.07844075395259e-07}, "score": 4.116706267241243}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8562700873517501, "4": 0.1435930531400844, "3": 0.00013648798079500223, "2": 2.674356126385446e-07, "1": 1.5687713666058603e-08}, "score": 4.856133093122216}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.830175105467381, "5": 0.08507570260288513, "3": 0.08378004720696423, "2": 0.0009554329207930104, "1": 1.3623027480075627e-05}, "score": 3.9993439204136525}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7270877407073764, "4": 0.2713877687068079, "3": 0.0015191845019089, "2": 4.657717670883462e-06, "1": 4.368456097679383e-07}, "score": 4.725558083703796}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6685724308448294, "5": 0.3305181845079243, "3": 0.0009086873248710648, "2": 7.03678331984842e-07, "1": 2.8144778162840463e-08}, "score": 4.329607994020337}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8444205048208895, "4": 0.15500868986333158, "3": 0.0005692926116766633, "2": 1.335712100112157e-06, "1": 1.4654211139497715e-07}, "score": 4.843848126853762}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8709043190506603, "4": 0.12899486262833956, "3": 0.00010072958580006714, "2": 9.653463317335693e-08, "1": 2.2090371546197384e-08}, "score": 4.870803304096339}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8639371550795543, "5": 0.13475627534487858, "3": 0.0013060611850882265, "2": 3.895691313363133e-07, "1": 0}, "score": 4.133449450878172}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7440457753750207, "4": 0.24738182147437174, "2": 0.007100227167671643, "5": 0.001464007852101634, "1": 8.104419725277904e-06}, "score": 3.2431934166655747}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7336985863538296, "5": 0.25965462406800244, "3": 0.006635501699265307, "2": 1.0949201792728657e-05, "1": 3.7664791437220304e-07}, "score": 4.252996084414945}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8577498775506878, "5": 0.13003448428135753, "3": 0.012199698996077014, "2": 1.564965008521935e-05, "1": 2.9952528467481995e-07}, "score": 4.117802586230819}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8239775620213812, "4": 0.1758208500142365, "3": 0.0002012116940312481, "2": 3.1665372825397266e-07, "1": 1.7790308397102633e-08}, "score": 4.82377569810447}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9248199028941744, "5": 0.06859682692895737, "3": 0.0065773391495320375, "2": 5.77101259369449e-06, "1": 5.582020144571382e-08}, "score": 4.062007784754505}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8611785938412916, "5": 0.11029247258217743, "3": 0.02850130794367632, "2": 2.7000099683102537e-05, "1": 4.724801979459148e-07}, "score": 4.081735759508441}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5516230204378988, "5": 0.44668129287449354, "3": 0.001693718282010282, "2": 1.563032052027109e-06, "1": 1.3985131701538854e-07}, "score": 4.444984147127611}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9277381332640804, "3": 0.057887720388277775, "5": 0.014324474516800979, "2": 4.8521236008809235e-05, "1": 8.625488948211359e-07}, "score": 3.9563371114329033}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.810516759535367, "4": 0.1888241727184415, "3": 0.0006585599504490546, "2": 4.3165335059463953e-07, "1": 4.9538633353183784e-08}, "score": 4.809857209207562}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5798299198983227, "5": 0.4172504658349304, "3": 0.00291826300792847, "2": 1.1674029233795639e-06, "1": 5.315328116549754e-08}, "score": 4.414329762715295}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7926755924602731, "3": 0.16703495117334724, "5": 0.03972046630779834, "2": 0.0005658163513452419, "1": 3.067336385022045e-06}, "score": 3.8715446667587026}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8096130836051767, "5": 0.1845342123316872, "3": 0.005843710642051317, "2": 8.79237226874812e-06, "1": 2.2293290170004672e-07}, "score": 4.1786722442363144}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9194794024539757, "4": 0.07969548059506337, "3": 0.0008237133209981747, "2": 1.2412631841149184e-06, "1": 6.83808515233386e-08}, "score": 4.918653087804517}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9938828603504143, "4": 0.0061045755427719854, "3": 1.237538671872266e-05, "2": 7.52304325266706e-08, "1": 4.3211161802999725e-08}, "score": 4.993870274717057}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9713411748370889, "4": 0.028603233731872332, "3": 5.532625434412188e-05, "2": 1.575184882272547e-07, "1": 1.6214725923205626e-08}, "score": 4.9712855737193244}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5801621416156568, "4": 0.4183967014442303, "3": 0.0014386622359460934, "2": 2.230617734201451e-06, "1": 1.7941217939892433e-07}, "score": 4.578718528910263}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5441679000216297, "5": 0.4529450786646708, "3": 0.002884460783375702, "2": 2.452398580202754e-06, "1": 1.0312933054599207e-07}, "score": 4.450055405947507}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7599318809862834, "4": 0.23880047699480556, "3": 0.0012653805145736617, "2": 2.1207876611612544e-06, "1": 1.1388427906861664e-07}, "score": 4.758661937600269}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5263213085407237, "4": 0.4730258220066781, "3": 0.0006522028009500402, "2": 6.720117576992907e-07, "1": 1.8354537826874965e-08}, "score": 4.5256676941866205}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.520705997880621, "5": 0.47666606816260915, "3": 0.002624681299561921, "2": 2.9866953974795526e-06, "1": 2.0299814416312176e-07}, "score": 4.474034834324791}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8444816937475168, "5": 0.1387441762790608, "3": 0.016757360238544523, "2": 1.654735975975957e-05, "1": 1.8146155932966623e-07}, "score": 4.121953181925858}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5560475871470819, "5": 0.44234000523799644, "3": 0.0016108718899763958, "2": 1.459093070278441e-06, "1": 9.195688601597422e-08}, "score": 4.440725932537091}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7044405762710778, "4": 0.29498832491051974, "3": 0.0005705498574102073, "2": 4.283856481433215e-07, "1": 2.768276000512386e-08}, "score": 4.703869151978315}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5755651219812582, "5": 0.4226776530374817, "3": 0.0017551446566842301, "2": 2.0209618429561927e-06, "1": 4.514031894037072e-08}, "score": 4.42091833702263}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9178366273950848, "4": 0.08207431185280185, "3": 8.883427524051294e-05, "2": 1.5222015132306788e-07, "1": 2.4725790209722762e-08}, "score": 4.917747459959056}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8998617901053386, "5": 0.09351796706734587, "3": 0.006613729257632188, "2": 6.2976878491636105e-06, "1": 1.2778010245049465e-07}, "score": 4.086891266748979}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7693098844278189, "4": 0.22855250816817446, "3": 0.0021325240517468076, "2": 4.676460675812636e-06, "1": 3.657049412953792e-07}, "score": 4.767166941936927}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5082608697914812, "4": 0.49020323919746095, "3": 0.0015346406954010823, "2": 1.1043131499648945e-06, "1": 5.607896781336111e-08}, "score": 4.506723897799284}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6587589716607176, "4": 0.3408560948524253, "3": 0.00038423469775808846, "2": 6.276821055467827e-07, "1": 2.6580446113461328e-08}, "score": 4.658373431172506}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9803132544459864, "4": 0.019643047894210234, "3": 4.338421034460244e-05, "2": 2.3743071080885035e-07, "1": 4.552865176737752e-08}, "score": 4.98026928867677}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7091772597120423, "3": 0.2821676446797711, "2": 0.005868714288810098, "5": 0.0027629039405617454, "1": 2.3548651506777915e-05}, "score": 3.708787205484169}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7872835682691933, "4": 0.2121290421711233, "3": 0.0005869542381697981, "2": 4.009833226123885e-07, "1": 5.3353513703951516e-08}, "score": 4.786695637044566}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6662804706425219, "5": 0.3153950181238848, "3": 0.018300615240508012, "2": 2.3120682377451306e-05, "1": 6.152740860786493e-07}, "score": 4.297046363234661}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941712146696223, "4": 0.005824582243245458, "3": 4.134008667786309e-06, "2": 2.4325759167714712e-08, "1": 0}, "score": 4.994167076501102}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7379363018227818, "5": 0.25980201988676876, "3": 0.0022604146705150945, "2": 1.2010198345183606e-06, "1": 4.5187063356536466e-08}, "score": 4.257539072099933}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7172950620160214, "4": 0.28213497155832745, "3": 0.0005694321054538142, "2": 4.342393314011461e-07, "1": 3.669200327655915e-08}, "score": 4.716724696788259}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8555670529961067, "3": 0.10304700867150307, "5": 0.0413241543038949, "2": 6.111324130275788e-05, "1": 4.1328640903015947e-07}, "score": 3.938153663365079}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.98561973210948, "4": 0.014348569904008042, "3": 3.1598655049558986e-05, "2": 5.468660711510197e-08, "1": 1.958196201124138e-08}, "score": 4.9855879900370175}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9939113603500517, "4": 0.0060732524116764, "3": 1.527938536253397e-05, "2": 6.730724188951024e-08, "1": 2.5119962203130323e-08}, "score": 4.993895886321864}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.821778586252473, "4": 0.17734216090643448, "3": 0.0008780034806878993, "2": 1.1131296561030667e-06, "1": 9.577223658246758e-08}, "score": 4.820898102408079}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8925115671680031, "5": 0.05648839839816884, "3": 0.050948115868856336, "2": 5.1380645659653515e-05, "1": 3.308710878891948e-07}, "score": 4.005436529750353}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.67430904460947, "4": 0.3249978539191155, "3": 0.0006917445623802365, "2": 1.2487643694285045e-06, "1": 8.208832789185404e-08}, "score": 4.673614573805295}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7148869504841526, "4": 0.28398078544317235, "3": 0.0011304369947471612, "2": 1.7348874794698808e-06, "1": 1.0536071429174092e-07}, "score": 4.713752718231991}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9698588088169121, "4": 0.03012462606585675, "3": 1.6495367071999387e-05, "2": 4.343362179606758e-08, "1": 0}, "score": 4.969842252105486}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5025404926034812, "4": 0.49673499715962965, "3": 0.0007234144236158283, "2": 1.0702471016827547e-06, "1": 1.8741041225876256e-08}, "score": 4.501814884887491}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8954857414980832, "4": 0.1038002707367393, "3": 0.0007104634886466274, "2": 3.2454225518468526e-06, "1": 2.6283641355078593e-07}, "score": 4.894768012987098}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8466105663919115, "5": 0.12599233590896097, "3": 0.027173278408902362, "2": 0.0002199843831089364, "1": 3.7951979034678076e-06}, "score": 4.0983677070462345}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6303830490483129, "5": 0.365645790392744, "3": 0.003968952789744998, "2": 2.21521963803366e-06, "1": 7.428847586585117e-08}, "score": 4.361672154735605}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8437175135465369, "4": 0.15614946834966872, "3": 0.0001327197228918237, "2": 2.2688671429591864e-07, "1": 0}, "score": 4.843584400361599}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9768918823105011, "4": 0.022997618773493298, "3": 0.00010858242456276469, "2": 1.7865110039501734e-06, "1": 1.3354571276530942e-07}, "score": 4.976779322744305}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7259735770990743, "4": 0.27199978585071427, "3": 0.0020246397408577484, "2": 1.9323484138524966e-06, "1": 8.206723390227977e-08}, "score": 4.723944814075673}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6274162393458783, "5": 0.3701872426993993, "3": 0.0023941260997210993, "2": 2.1994768969200577e-06, "1": 5.99607293406081e-08}, "score": 4.367788586465296}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8674530410332966, "5": 0.11336461198667883, "3": 0.019172360392599334, "2": 9.923528543143998e-06, "1": 4.692820295049151e-08}, "score": 4.094172265271447}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7401103738906321, "5": 0.25871526110883314, "3": 0.0011730066970406842, "2": 1.3570545214356117e-06, "1": 1.7501486793451604e-08}, "score": 4.257539483612625}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6329802993450041, "4": 0.3633195241775921, "3": 0.0036914619757710803, "2": 8.482002433586872e-06, "1": 2.912837380433042e-07}, "score": 4.629270962521748}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8686632093502065, "5": 0.11488875116591384, "3": 0.016383820270554454, "2": 6.255396085716374e-05, "1": 1.505746152847666e-06}, "score": 4.098375321426672}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9235899803814085, "3": 0.05690742808846936, "5": 0.019322891458169063, "2": 0.00017782475768598547, "1": 1.61311897736636e-06}, "score": 3.962054964548386}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9164604737675845, "5": 0.05647740117761489, "3": 0.026985354124091223, "2": 7.494043200027413e-05, "1": 1.5438473157723229e-06}, "score": 4.029337543057223}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9273946405938638, "4": 0.07253768203057559, "3": 6.730493470531204e-05, "2": 2.2395280483300462e-07, "1": 3.4936839199460565e-08}, "score": 4.9273268882421215}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8641104264099695, "3": 0.12608507518431805, "5": 0.00835822662987822, "2": 0.0014380057803161774, "1": 8.292003013236566e-06}, "score": 3.879372267013113}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8888879605839367, "3": 0.10709153959787909, "5": 0.003984769939599868, "2": 3.550706028462914e-05, "1": 9.926627013331914e-08}, "score": 3.896821905674478}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.850309370859645, "4": 0.14929194913051874, "3": 0.00039787662029433697, "2": 7.643416208585701e-07, "1": 5.908327189865031e-08}, "score": 4.849909771278053}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9652662345197005, "4": 0.034679019508641266, "3": 5.4675382256210105e-05, "2": 1.965517843032664e-08, "1": 0}, "score": 4.965211568989389}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948302921738092, "4": 0.005161087323906789, "3": 8.548318166818147e-06, "2": 3.744655951356655e-08, "1": 7.2197970056346155e-09}, "score": 4.9948216746783975}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.99798097038796, "4": 0.0020168588552990055, "3": 2.1121714847194983e-06, "2": 5.607319719161003e-09, "1": 1.8709191551901714e-09}, "score": 4.997978892392802}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7800614268714595, "5": 0.2129492509737375, "3": 0.006977829991597126, "2": 1.1203907013531948e-05, "1": 2.503009107203801e-07}, "score": 4.205948270082206}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9048194300468902, "5": 0.05267564892269714, "3": 0.04220289324425151, "2": 0.0002983745444728108, "1": 3.493061449884068e-06}, "score": 4.009865528985412}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7140139849997418, "4": 0.28505931430474485, "3": 0.0009259475188797976, "2": 6.486523072063518e-07, "1": 1.8404456510499035e-08}, "score": 4.713086746373817}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9718400195580402, "4": 0.028069707753757618, "3": 8.971585936612587e-05, "2": 3.8434086839496907e-07, "1": 4.946443057066721e-08}, "score": 4.971749506171707}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.867474120398307, "4": 0.13226235381719828, "3": 0.0002624077411488596, "2": 1.0174602365001708e-06, "1": 1.0698277465249823e-07}, "score": 4.867209351238511}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6344435268279965, "5": 0.3614081680300986, "3": 0.004141316692677155, "2": 6.568901098234854e-06, "1": 3.190927576807996e-07}, "score": 4.357252792144914}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9993135371934755, "4": 0.0006854253249860464, "3": 1.0101956833361888e-06, "2": 1.2158661992184283e-08, "1": 6.926321311284686e-09}, "score": 4.999312490096739}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8482618122330661, "4": 0.15158511448616577, "3": 0.00015298632800638857, "2": 7.295266724502681e-08, "1": 9.016478403535763e-09}, "score": 4.848108657176937}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9918877066959048, "4": 0.008109421865640152, "3": 2.852296781476256e-06, "2": 5.806818537316904e-09, "1": 2.0083547146413978e-09}, "score": 4.991884847995006}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9428467545359951, "4": 0.057130480250839166, "3": 2.2697313238940455e-05, "2": 3.106174000589192e-08, "1": 4.00892384289711e-09}, "score": 4.942824014024723}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9494460630289623, "4": 0.050428519542850436, "3": 0.00012491038472170073, "2": 4.2667680809955646e-07, "1": 5.834197615551732e-08}, "score": 4.949320145173169}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5624941752884113, "4": 0.43434771891976054, "3": 0.003154183537991856, "2": 3.681775313370577e-06, "1": 1.4049780093546153e-07}, "score": 4.559332262628834}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5419143314991236, "5": 0.45633587619485194, "3": 0.0017473935522811241, "2": 2.2228197730956925e-06, "1": 9.661401726421684e-08}, "score": 4.454583783218537}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9547203582189977, "4": 0.04521697543177779, "3": 6.239318520570076e-05, "2": 1.7070771703425613e-07, "1": 3.222639498989742e-08}, "score": 4.954657593984686}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5943545988339055, "4": 0.4043725671769126, "3": 0.0012687298462873064, "2": 4.0100052797531215e-06, "1": 1.199425450585752e-07}, "score": 4.593077473845101}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6393063618398591, "3": 0.354202462985515, "5": 0.005596261463421158, "2": 0.0008934885841493694, "1": 1.3499945534548017e-06}, "score": 3.6496027449997244}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8726795047178616, "4": 0.12716553704073993, "3": 0.00015467166161546865, "2": 3.257423843607033e-07, "1": 3.137783766745548e-08}, "score": 4.872524025889737}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5991767795199903, "4": 0.3992504598911557, "3": 0.0015671791427973461, "2": 5.384204410788298e-06, "1": 2.2215844354091054e-07}, "score": 4.597598150602808}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9984821266367981, "4": 0.0015159954395179865, "3": 1.8504883143518281e-06, "2": 1.2056547060912986e-08, "1": 6.727689942392014e-09}, "score": 4.998480240490305}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6881919106823712, "4": 0.31113097934929557, "3": 0.0006760226341577209, "2": 1.0463663653137498e-06, "1": 4.612932371040378e-08}, "score": 4.6875136533789}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7080471722756152, "5": 0.282199870064828, "3": 0.009735502729918293, "2": 1.6390609149087394e-05, "1": 8.407588164248376e-07}, "score": 4.272429124744873}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9901961907622041, "4": 0.009788774588383458, "3": 1.4888819437589088e-05, "2": 4.8770900654852734e-08, "1": 1.9221815095731487e-08}, "score": 4.990181223808514}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.890916741286854, "4": 0.10858505457146017, "3": 0.0004975298515749579, "2": 4.988202632340714e-07, "1": 9.284670844670798e-08}, "score": 4.890418008823759}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.80083795960534, "4": 0.19792322025148612, "3": 0.0012351597068197468, "2": 3.056130453217246e-06, "1": 3.450198104394442e-07}, "score": 4.799595859902268}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6194282895378228, "5": 0.3788916494988467, "3": 0.0016778954150918645, "2": 1.954771990947408e-06, "1": 1.112236275202532e-07}, "score": 4.377209548421089}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9490503271576487, "4": 0.050806244943223285, "3": 0.00014279079084775654, "2": 3.673552402410892e-07, "1": 1.565473995967866e-07}, "score": 4.948906439435683}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996208766254361, "4": 0.00037857702694199394, "3": 4.6886779276412936e-07, "1": 9.87509407127041e-09, "2": 7.33504713010441e-09}, "score": 4.999620423709077}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8932778046957126, "4": 0.10643114805906505, "3": 0.00029057742324128477, "2": 3.8257963854696643e-07, "1": 4.12451214103513e-08}, "score": 4.892986379452721}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8977705190971196, "4": 0.10215280484445252, "3": 7.642551129928057e-05, "2": 2.0343790779973175e-07, "1": 0}, "score": 4.8976937289996565}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9682514878017725, "4": 0.03172876170973385, "3": 1.9643461954029874e-05, "2": 6.513270714485714e-08, "1": 0}, "score": 4.968231754637343}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7378506250128406, "3": 0.2557381268645774, "5": 0.004896912375148773, "2": 0.0015107642958758164, "1": 3.4486869278189405e-06}, "score": 3.7461268796913973}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8758042078917847, "5": 0.116406186089285, "3": 0.007777738222192787, "2": 1.1697949358805975e-05, "1": 9.577424782055377e-08}, "score": 4.108604772690327}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5719642726243583, "4": 0.42603147945867553, "3": 0.002003508670942521, "2": 6.586780269906518e-07, "1": 6.028195691274328e-08}, "score": 4.569959277313708}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9277616238910047, "4": 0.07208039396743916, "3": 0.00015731175828412452, "2": 6.438075441452024e-07, "1": 0}, "score": 4.927603049169358}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7506643534088241, "4": 0.2481682587915216, "3": 0.0011635906113488567, "2": 3.5523755828829863e-06, "1": 2.4715701846601146e-07}, "score": 4.74949291481822}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8591547859851987, "4": 0.14052146866433038, "3": 0.00032338014734897293, "2": 3.236646137601184e-07, "1": 2.2443764766963452e-08}, "score": 4.85883070757648}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9996400503274331, "4": 0.0003596869817079768, "3": 2.1459291976531043e-07, "2": 2.5822053921245003e-09, "1": 0}, "score": 4.999639876069445}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9960518282059773, "4": 0.003943350248928689, "3": 4.803719712775301e-06, "2": 2.0317870864831643e-08, "1": 0}, "score": 4.996046981367887}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9998537999282723, "4": 0.0001460194099834836, "3": 1.5433612239773364e-07, "2": 2.168587072776393e-09, "1": 0}, "score": 4.999853665408475}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9997179661490261, "4": 0.00028193880898124, "3": 7.688208134539592e-08, "2": 1.3265383925838588e-09, "1": 0}, "score": 4.999717903442492}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9815750554908148, "4": 0.0184167334686859, "3": 8.214579455957134e-06, "2": 3.561157897018124e-08, "1": 0}, "score": 4.9815667312593375}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8470456073754182, "5": 0.11622382745901755, "3": 0.03655701435432154, "2": 0.0001711413046008053, "1": 2.0876135217988147e-06}, "score": 4.079318293186941}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5645439172072774, "4": 0.4344587827983027, "3": 0.0009955718124449976, "2": 1.6849073177085726e-06, "1": 9.818150298201832e-08}, "score": 4.563544650093229}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8573828820240588, "5": 0.12134442370846123, "3": 0.02106652060138567, "2": 0.00020140515141059447, "1": 4.569307026020816e-06}, "score": 4.099861404776333}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5217670787352213, "4": 0.47469936078121366, "3": 0.0035237884638297367, "2": 9.375131120677547e-06, "1": 4.2998909028968493e-07}, "score": 4.5182232328884435}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8714738850415087, "4": 0.1282221080083686, "3": 0.0003030484088604503, "2": 8.71288226820541e-07, "1": 1.1575296832875249e-07}, "score": 4.87116872196904}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5500355865668177, "4": 0.44878042142547736, "3": 0.0011830067360044817, "2": 9.958247984556006e-07, "1": 5.037599827512434e-08}, "score": 4.548850403612263}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.998057309271136, "4": 0.0019397200896545765, "3": 2.97267600212428e-06, "2": 1.140409882630602e-08, "1": 8.803292831979076e-09}, "score": 4.998054265176155}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.985229975890882, "4": 0.01476073004484659, "3": 9.230973903596125e-06, "2": 1.8018424846334495e-08, "1": 0}, "score": 4.985220753285943}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9950860242778938, "4": 0.004910951832780036, "3": 2.9781686301601033e-06, "2": 1.1083946907165056e-08, "1": 0}, "score": 4.995083058407811}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "human", "scores": {"4": 0.811854647813161, "3": 0.18676341939761948, "5": 0.0012782849273855004, "2": 0.00010339944121653017, "1": 1.9006428118074287e-07}, "score": 3.8143074856181545}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8934319218095644, "4": 0.10650473869859867, "3": 6.308105949234161e-05, "2": 1.773912662933782e-07, "1": 2.2499516879247702e-08}, "score": 4.8933684707681735}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6052389138365244, "5": 0.39424232132232506, "3": 0.0005184670920021394, "2": 2.374734521834043e-07, "1": 4.790063863242226e-08}, "score": 4.39372324045385}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7196737101762724, "5": 0.27961908855841333, "3": 0.0007063170090031401, "2": 8.041154367713266e-07, "1": 8.992867327429401e-08}, "score": 4.278910890802594}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8498817133043091, "5": 0.14886323209090596, "3": 0.0012523168039679069, "2": 2.6663914940719307e-06, "1": 9.366062126673096e-08}, "score": 4.147605298237676}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8901444731926536, "3": 0.07769930238211495, "5": 0.03202413953821868, "2": 0.00013030496111494537, "1": 1.4524191680392927e-06}, "score": 3.9540598549306627}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5159221484398188, "4": 0.4757968031644381, "3": 0.008261230761054969, "2": 1.8224257894376953e-05, "1": 1.3522441666696012e-06}, "score": 4.5076205348343485}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5656395166849009, "4": 0.4307855829591623, "3": 0.0035639300371341294, "2": 1.0661728544283924e-05, "1": 3.176263960621629e-07}, "score": 4.5620533052327}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9562469723656236, "4": 0.04366248990737879, "3": 9.001655140881389e-05, "2": 4.1751389991505297e-07, "1": 0}, "score": 4.956156219903184}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8934883616866999, "4": 0.10600316784356245, "3": 0.0005010680188134906, "2": 6.843864503379823e-06, "1": 4.43811461925596e-07}, "score": 4.892972376995362}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7487212407297495, "3": 0.24464071846014582, "5": 0.005815323863880318, "2": 0.000819742984805861, "1": 2.8511789002569517e-06}, "score": 3.7595265363714843}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5533477126059753, "5": 0.4425308497566884, "3": 0.004117086606923154, "2": 4.113094060104369e-06, "1": 8.830580409116e-08}, "score": 4.438405337643064}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6262161061273772, "5": 0.3443116405107197, "3": 0.029463946960115017, "2": 8.092158917587267e-06, "1": 8.770911579846634e-08}, "score": 4.3148312859422076}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9280414047534835, "4": 0.07192110677236205, "3": 3.746598886980498e-05, "2": 2.19251380991729e-08, "1": 0}, "score": 4.928003895434156}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8879779121537985, "3": 0.07413600257235221, "5": 0.0374584560042741, "2": 0.0004251425642478459, "1": 2.348081373694335e-06}, "score": 3.962465118856071}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8701621720930942, "4": 0.12962896819729353, "3": 0.00020844548786456613, "2": 3.313273425355598e-07, "1": 5.035736260357437e-08}, "score": 4.8699529411841525}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8571601028825686, "4": 0.1413465362384329, "3": 0.0014747488129463143, "2": 1.65116890599262e-05, "1": 2.016673875435313e-06}, "score": 4.855646352290142}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.914102627421849, "4": 0.08558383133064068, "3": 0.00031315383579560394, "2": 2.787996258673907e-07, "1": 1.8174324148416437e-08}, "score": 4.9137889441048594}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9718709925930162, "4": 0.02809411093144064, "3": 3.474259855021759e-05, "2": 9.937860379755273e-08, "1": 1.723730338721404e-08}, "score": 4.971836035737015}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5641040492575774, "4": 0.4338371698320095, "3": 0.002055994718943015, "2": 2.6634640711970806e-06, "1": 1.3495937901115467e-07}, "score": 4.562042315857465}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9234047498980166, "4": 0.076436037423305, "3": 0.00015896762386002214, "2": 1.9724701705428478e-07, "1": 4.518954871336775e-08}, "score": 4.923245254628767}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8021886935890478, "4": 0.19753948313769204, "3": 0.00027130036308086684, "2": 4.0080532553542386e-07, "1": 5.9425167798618524e-08}, "score": 4.801916463603685}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7760971525890417, "5": 0.21632075412042345, "3": 0.007570864630677603, "2": 1.0582424489383885e-05, "1": 6.035873909595216e-07}, "score": 4.208726922780375}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.978949330671414, "4": 0.021036972374865997, "3": 1.3678654580296762e-05, "2": 3.60577506174748e-08, "1": 1.330664902431723e-08}, "score": 4.978935509570499}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9280347321597713, "5": 0.06016244250590939, "3": 0.011767528061860991, "2": 3.457668316626341e-05, "1": 6.666031137443818e-07}, "score": 4.04832376387719}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7573918227859815, "5": 0.22565818057209755, "3": 0.01685642313271789, "2": 9.21129515247135e-05, "1": 1.2986114236682586e-06}, "score": 4.208613669486263}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7569201222019337, "4": 0.24254160895590848, "3": 0.0005354689248066353, "2": 2.5002295757656606e-06, "1": 2.3652190777654335e-07}, "score": 4.756378991029589}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8967139043596424, "5": 0.08026659075173985, "3": 0.022973440297204505, "2": 4.5057865241155225e-05, "1": 8.118964739892939e-07}, "score": 4.05720061017901}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7971894775424411, "5": 0.2000642327992434, "3": 0.0027416317682105195, "2": 4.535977281676991e-06, "1": 9.331266438383066e-08}, "score": 4.197313254781666}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8836960591116795, "5": 0.10143240124108592, "3": 0.014799957053600916, "2": 6.973989655590416e-05, "1": 1.7254131998848963e-06}, "score": 4.086487798298398}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9077095957554819, "3": 0.06750090323053967, "5": 0.024650980559365702, "2": 0.0001359941075506925, "1": 2.2657629782792733e-06}, "score": 3.956871280586132}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9261886725835143, "3": 0.059738211781204135, "5": 0.013959606077362787, "2": 0.00011292349544515868, "1": 4.751981319439903e-07}, "score": 3.9539941166104615}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7481609128593683, "5": 0.2460987994250282, "3": 0.005718077680026618, "2": 2.1110690226040165e-05, "1": 7.77356325750744e-07}, "score": 4.240336245681205}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9903837071149252, "4": 0.009608736906174255, "3": 7.341480739918771e-06, "2": 6.891327547883504e-08, "1": 0}, "score": 4.990376371991465}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5472757665480209, "4": 0.4489111926504328, "3": 0.003800183210965699, "2": 1.1403833353583146e-05, "1": 1.306358581623643e-06}, "score": 4.54344893669824}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8708806394841505, "5": 0.12175001424711741, "3": 0.0073340455393896276, "2": 3.3982733519605246e-05, "1": 1.2965573480144121e-06}, "score": 4.114344116020008}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5645912561993947, "4": 0.41276844876137064, "2": 0.021004552059724756, "5": 0.0016121461100763285, "1": 2.3597872459916593e-05}, "score": 3.394940992780742}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6709822469238719, "4": 0.32667339475792445, "3": 0.0023420126791694053, "2": 1.9784872903960887e-06, "1": 1.5789382870723334e-07}, "score": 4.668635943506}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9364139134767085, "4": 0.06355686258509007, "3": 2.903388389108972e-05, "2": 1.1680079033598064e-07, "1": 0}, "score": 4.9363847145847135}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7169356438086656, "4": 0.28289275804354375, "3": 0.00017112162448240482, "2": 2.1498426447188893e-07, "1": 0}, "score": 4.716764279677498}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5339035629807233, "5": 0.45727157891909787, "3": 0.00882154724275367, "2": 3.090780221684767e-06, "1": 1.8518972441387283e-07}, "score": 4.448443310191784}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8496258864272537, "5": 0.09656962772368727, "3": 0.05377441943900308, "2": 2.9850110986257393e-05, "1": 1.568967329378596e-07}, "score": 4.042735039911074}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.567005741048301, "4": 0.4287410737331476, "3": 0.004251080895622618, "2": 1.919918155839643e-06, "1": 8.3597936514608e-08}, "score": 4.562750626251667}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983562798900703, "4": 0.0016423305152369672, "3": 1.358732877834693e-06, "2": 4.838229446422672e-09, "1": 0}, "score": 4.9983549374615075}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6589482603032872, "4": 0.34054588662178964, "3": 0.0005056160354248319, "2": 2.3913968492249064e-07, "1": 0}, "score": 4.658442164605641}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9294490386043563, "5": 0.05650815019466169, "3": 0.014040573972330009, "2": 2.1242643579875925e-06, "1": 0}, "score": 4.042463332490455}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.861262588685491, "4": 0.13837261830353986, "3": 0.0003646273809274891, "2": 1.710703434203264e-07, "1": 3.7759188005196323e-08}, "score": 4.860897468695981}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6004988214971468, "5": 0.39791512906206156, "3": 0.0015828741534683899, "2": 2.9069910940922046e-06, "1": 2.1048846151119762e-07}, "score": 4.396325832371732}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5346839576512384, "5": 0.4632973529705941, "3": 0.0020176381183797804, "2": 9.018153947226126e-07, "1": 8.941726970397374e-08}, "score": 4.461277670658788}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7563980652809165, "5": 0.24259264507924472, "3": 0.0010084497785253638, "2": 7.085288916714715e-07, "1": 5.665729979288838e-08}, "score": 4.241582626311248}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9184385620531762, "4": 0.08151824652917485, "3": 4.306917560063785e-05, "2": 3.262979529115485e-08, "1": 3.075793254540309e-09}, "score": 4.9183954978653}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6637354815740354, "5": 0.3296941079524465, "3": 0.006565265042457742, "2": 5.058325794838121e-06, "1": 1.1441598943258113e-07}, "score": 4.3231183741858334}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9268996052336985, "4": 0.07302117583261133, "3": 7.895053822471875e-05, "2": 1.363053837169699e-07, "1": 1.7136536763464644e-08}, "score": 4.92682043721639}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9431957318023234, "4": 0.05674235757336302, "3": 6.17046663656154e-05, "2": 9.318892060035234e-08, "1": 1.437141029581307e-08}, "score": 4.943133890446013}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5580737091911521, "5": 0.44046334470358217, "3": 0.0014584359275429074, "2": 4.426660923442661e-06, "1": 7.592855534839914e-08}, "score": 4.438995830999733}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5755522467334897, "3": 0.41498350770956133, "2": 0.007997344739166566, "5": 0.0014415999583524655, "1": 2.5014797705115987e-05}, "score": 3.57038823548186}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9893277983879203, "4": 0.010654733771439322, "3": 1.7349064020011456e-05, "2": 5.8690849976812186e-08, "1": 3.386875259482465e-08}, "score": 4.989310256272708}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.810120813474595, "5": 0.1869684112861921, "3": 0.002909662162206556, "2": 1.0487422174281662e-06, "1": 1.8773003183979685e-08}, "score": 4.1840566037064875}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9988474669769418, "4": 0.001151218422100051, "3": 1.3099219535090885e-06, "1": 6.667812445519616e-09, "2": 5.601065440890815e-09}, "score": 4.998846118268305}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7432683712145366, "5": 0.25505739008215894, "3": 0.0016730951244274916, "2": 1.1440224969888284e-06, "1": 2.2817295819370836e-08}, "score": 4.253381932566954}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6740375213234255, "5": 0.1777912090567667, "3": 0.14687883261854956, "2": 0.0012782456846406089, "1": 1.4191448401698649e-05}, "score": 4.028313310719999}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8375796042073841, "5": 0.126559364032889, "3": 0.035804632303272424, "2": 5.544976955958873e-05, "1": 8.57177347372357e-07}, "score": 4.090641269043638}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6995613382603622, "5": 0.2856551685440614, "3": 0.014762855743019653, "2": 2.0232081911372415e-05, "1": 2.7612670513405735e-07}, "score": 4.270851055262961}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9156554054597513, "4": 0.08425728033595084, "3": 8.710358633844828e-05, "2": 1.5905257961330662e-07, "1": 0}, "score": 4.915568030979867}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5803299255575596, "5": 0.4184865617842741, "3": 0.001181284113995994, "2": 1.937564085265215e-06, "1": 8.937006984742879e-08}, "score": 4.4173012185640035}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5468329588888392, "4": 0.4481118556236893, "5": 0.004102888668747594, "2": 0.0009493917894790984, "1": 2.7923081786020987e-06}, "score": 3.4553627078843183}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9947945361286175, "4": 0.005200585830650015, "3": 4.8034266948099576e-06, "2": 6.736253008954496e-09, "1": 3.166126248310801e-09}, "score": 4.994789774105534}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8598462025255115, "4": 0.13969351984717465, "3": 0.000459776709712944, "2": 5.21968288974536e-07, "1": 4.621862414814832e-08}, "score": 4.859385185413098}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9578009300947725, "4": 0.042022516382757405, "3": 0.00017564476206379063, "2": 7.009137471950033e-07, "1": 8.701520181936817e-08}, "score": 4.95762373817068}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7587031536478868, "5": 0.23217741029549707, "3": 0.009108598695626254, "2": 1.0292490564893785e-05, "1": 4.017925203880671e-07}, "score": 4.223047053154285}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5949276365954671, "5": 0.4013621468025736, "3": 0.0037062081018894217, "2": 3.703560143450922e-06, "1": 1.5649465201158977e-07}, "score": 4.3976481211254255}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6086474492302085, "4": 0.39056769892641063, "3": 0.0007838119704407822, "2": 9.451482910666025e-07, "1": 5.479280210874288e-08}, "score": 4.607861606857816}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.778060480027985, "5": 0.2184980475902815, "3": 0.0034386803513188715, "2": 2.3507315038762855e-06, "1": 1.2090671972721e-07}, "score": 4.215054371957536}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.69091688130267, "4": 0.30715560596012953, "3": 0.0019245790701695887, "2": 2.820196484744955e-06, "1": 1.3965775701256503e-07}, "score": 4.6889862248236325}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9910534596011699, "4": 0.008932584573906253, "3": 1.3889616657930433e-05, "2": 2.234484927367384e-08, "1": 0}, "score": 4.9910395687651965}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9010161022516773, "3": 0.06224130077432339, "5": 0.0366904784632821, "2": 5.1546074488162984e-05, "1": 4.490215297088288e-07}, "score": 3.974344735309156}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9824572584842582, "4": 0.017523602367961567, "3": 1.91672301525069e-05, "2": 2.7952812955342996e-08, "1": 8.265513319330716e-09}, "score": 4.982437947380492}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7670441402906857, "4": 0.23247897224542674, "3": 0.0004766139613910913, "2": 2.967457872056595e-07, "1": 0}, "score": 4.766566915020183}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9410141107741468, "3": 0.04499540524912259, "5": 0.013916452579231296, "2": 7.346290301825419e-05, "1": 4.1455880612389417e-07}, "score": 3.9687728730406846}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7218289135581635, "4": 0.2780479216809356, "3": 0.00012300949628536254, "2": 1.6609515332705422e-07, "1": 0}, "score": 4.721705564055111}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6380130763506311, "4": 0.3519171149511394, "2": 0.009419521385669413, "5": 0.0006385184417372585, "1": 1.1638139095062568e-05}, "score": 3.3437513991099688}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9702118133930453, "4": 0.029705246468589, "3": 8.262997911536777e-05, "2": 1.7811436374769302e-07, "1": 2.8614879276011823e-08}, "score": 4.9701288416809986}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8034604477254838, "5": 0.1762378104938545, "3": 0.02028375418069485, "2": 1.7705185414820064e-05, "1": 2.0044839597703305e-07}, "score": 4.1559180573771455}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9865687224960488, "4": 0.013412931500817979, "3": 1.8075538460814286e-05, "2": 1.1919559949319595e-07, "1": 2.8956388027927142e-08}, "score": 4.986550442364859}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7953407021247463, "4": 0.2041894785090424, "3": 0.00046819485118958557, "2": 1.5179193644498283e-06, "1": 9.756363550442391e-08}, "score": 4.794869185923197}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8331951171251285, "4": 0.16605013801407267, "3": 0.000753233413582865, "2": 1.3370845810873182e-06, "1": 1.4091724975790557e-07}, "score": 4.832438814631872}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5961952529183934, "5": 0.40128629251204195, "3": 0.0025092198271285736, "2": 8.983535903292332e-06, "1": 2.412398910472654e-07}, "score": 4.3987583858677155}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.932411321102196, "4": 0.06738215895741874, "3": 0.00020618144002718548, "2": 2.494615604392582e-07, "1": 4.0628745647210484e-08}, "score": 4.932204563980883}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9389039731680944, "3": 0.045069704444509764, "5": 0.01566995647842507, "2": 0.00035171653678970586, "1": 4.563448364241615e-06}, "score": 3.969883126027487}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9979856027269811, "4": 0.002013151247050884, "3": 1.1861129806440816e-06, "2": 6.433642331847509e-09, "1": 0}, "score": 4.99798445711827}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9702389602993674, "4": 0.029613581157222953, "3": 0.00014651291154173322, "2": 6.210203411961671e-07, "1": 8.630260965281797e-08}, "score": 4.970091177620693}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9847603036222762, "4": 0.015224230629944612, "3": 1.5275978439484163e-05, "2": 1.0319741837066297e-07, "1": 4.400665343623573e-08}, "score": 4.9847447311449615}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7692190727562266, "5": 0.21047899859118324, "3": 0.020259632895399962, "2": 4.1009984357161164e-05, "1": 1.0645206010557492e-06}, "score": 4.190134194232881}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9628820659002112, "4": 0.0370358950548034, "3": 8.144480552217219e-05, "2": 4.7249579004971544e-07, "1": 8.664903132641724e-08}, "score": 4.962799449945117}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6811549538653454, "5": 0.3169284310984899, "3": 0.0019141588417016543, "2": 2.3312102608121354e-06, "1": 8.381473580406792e-08}, "score": 4.315009371360826}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9466096037884736, "3": 0.04909276536236568, "5": 0.004086155608412251, "2": 0.0002090121863091519, "1": 2.119093828596207e-06}, "score": 3.954568992965465}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6562110166767363, "5": 0.3412309016192622, "3": 0.002555338445773107, "2": 2.35851116568924e-06, "1": 1.4673890292605216e-07}, "score": 4.338670486540788}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5020533952032724, "5": 0.49294414869904535, "3": 0.0049964650828933374, "2": 5.57136762529159e-06, "1": 2.6780010810802685e-07}, "score": 4.487935811572195}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7582006261975647, "4": 0.24136443723472537, "3": 0.0004341716044743562, "2": 6.098181737696077e-07, "1": 7.447785530313119e-08}, "score": 4.757765072649969}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.908466045579585, "4": 0.09146656347389587, "3": 6.687702987083533e-05, "2": 3.5864600264350004e-07, "1": 1.3500446297234662e-07}, "score": 4.90839806465408}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.706116599518604, "5": 0.29000309025693394, "3": 0.0038724147504580215, "2": 7.585196796620204e-06, "1": 2.3244225694280817e-07}, "score": 4.286114830055845}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8474284568389722, "4": 0.15176091865999267, "3": 0.0008072783739847204, "2": 3.2096585410021297e-06, "1": 1.762204621389354e-07}, "score": 4.846614196831951}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5779582758650853, "3": 0.41518077549364457, "5": 0.005074579574241028, "2": 0.0017738417575561913, "1": 1.2231377276628226e-05}, "score": 3.5863093040092573}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9490580524587536, "4": 0.05088609375115614, "3": 5.5446109995564825e-05, "2": 2.8636975828944356e-07, "1": 0}, "score": 4.949002148733012}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8077842689370867, "4": 0.1920222746272171, "3": 0.00019295279200296574, "2": 4.3844257128227665e-07, "1": 0}, "score": 4.8075904919157475}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7391037836039713, "4": 0.2522667801646386, "2": 0.007083400428966506, "5": 0.0015376945956746236, "1": 8.302673388692458e-06}, "score": 3.248242173145849}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6888926952069684, "4": 0.3102253221134402, "3": 0.000881385021224678, "2": 5.847648712482698e-07, "1": 3.5814643172634694e-08}, "score": 4.6880100174420924}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9129181289235002, "5": 0.062377290758353264, "3": 0.02467021335795891, "2": 3.378664337480551e-05, "1": 4.6595303088169363e-07}, "score": 4.037638110558988}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7680828147055712, "4": 0.23173673837821282, "3": 0.00018030206043599998, "2": 1.5730157723647414e-07, "1": 0}, "score": 4.767902188484825}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9005945613962896, "5": 0.09393426968290716, "3": 0.00546659687319538, "2": 4.509009732801202e-06, "1": 4.639180544963034e-08}, "score": 4.088458517087315}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "human", "scores": {"3": 0.8393276871955616, "2": 0.10310482395144642, "4": 0.05734796040684641, "5": 0.00014296953390757988, "1": 7.648965920954603e-05}, "score": 2.9543760930452025}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.962885050839242, "4": 0.036837972661986094, "3": 0.00027405629951509367, "2": 2.6079776075469855e-06, "1": 2.2688716806980066e-07}, "score": 4.962605180066421}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9325863045039051, "4": 0.06719597023447463, "3": 0.00021667803844266581, "2": 8.849851249905668e-07, "1": 4.476971189225665e-08}, "score": 4.932367831709778}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9823461183989617, "4": 0.017616047545680098, "3": 3.758919183827959e-05, "2": 2.580847029235892e-07, "1": 3.755433572584069e-08}, "score": 4.98230785049752}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9485931402605718, "4": 0.0512256600310609, "3": 0.00017999688730024527, "2": 1.066213468918146e-06, "1": 9.06887974120437e-08}, "score": 4.948410782429827}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "human", "scores": {"4": 0.811457910231874, "5": 0.12409172116450953, "3": 0.06436922067182443, "2": 7.954202974231091e-05, "1": 1.266850067816135e-06}, "score": 4.059559636076809}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9994586692723768, "4": 0.0005395080781375308, "3": 1.7354861189096655e-06, "2": 4.7038241976360035e-09, "1": 0}, "score": 4.999457006793377}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9968654715244383, "4": 0.0031233754092891476, "3": 1.1139747386265821e-05, "2": 1.4240326540651069e-08, "1": 0}, "score": 4.996854302377857}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9971714313599198, "4": 0.002824233439655475, "3": 4.343135522873977e-06, "2": 1.0987022866472193e-08, "1": 3.632735104766496e-09}, "score": 4.997167032861188}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7254352423355882, "4": 0.27377209192820157, "3": 0.0007881244887002021, "2": 4.421670465068683e-06, "1": 1.9794551913461208e-07}, "score": 4.724637623880655}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5508881252049436, "5": 0.44447085243622536, "3": 0.00463311199276672, "2": 7.646978159451204e-06, "1": 2.0368360560324152e-07}, "score": 4.439821861695579}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8957470778864952, "5": 0.09474676292340488, "3": 0.009483094423464917, "2": 2.2356107679203645e-05, "1": 5.964478654395679e-07}, "score": 4.085217176503297}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8852978295703133, "4": 0.11411020351942294, "3": 0.000591669118966112, "2": 2.6103926508503226e-07, "1": 2.8053175579366925e-08}, "score": 4.884705561909217}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6651086953692308, "5": 0.33348219611967045, "3": 0.001408100001465843, "2": 8.897484985980641e-07, "1": 5.616505896501794e-08}, "score": 4.332072168912445}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9317031720020481, "4": 0.06822049814368823, "3": 7.61720469880612e-05, "2": 7.123397182117778e-08, "1": 0}, "score": 4.931626938141138}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9215046967797562, "4": 0.07840810318619226, "3": 8.663410480529693e-05, "2": 3.8534569363084244e-07, "1": 1.4204143871219758e-07}, "score": 4.921416901372604}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5678106605128616, "4": 0.43172046583692064, "3": 0.00046802099590877795, "2": 7.523636896906818e-07, "1": 6.431158827079722e-08}, "score": 4.5673409622671866}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.589885752891385, "4": 0.4085754016306544, "3": 0.0015378483728229215, "2": 9.294228823843527e-07, "1": 4.0016058535893656e-08}, "score": 4.588345941901915}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9558153013699143, "4": 0.04416506001078213, "3": 1.956205182168405e-05, "2": 4.813145131616015e-08, "1": 1.0086116123730345e-08}, "score": 4.95579563033561}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8385258662112302, "4": 0.16133495650545518, "3": 0.00013901927018750032, "2": 1.51749151265656e-07, "1": 1.799318071497104e-08}, "score": 4.838386479629592}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7482717236959026, "5": 0.24547229240770962, "3": 0.006250858279137467, "2": 4.805631973735668e-06, "1": 1.9170655373976094e-07}, "score": 4.23921127843068}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "claude", "scores": {"2": 0.6931843207840472, "3": 0.2745855524790908, "4": 0.029219990435114595, "1": 0.0025947674007602995, "5": 0.00041538016367897833}, "score": 2.3316769027040216}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9044530252406167, "4": 0.09499249409778603, "3": 0.0005533856065915584, "2": 9.218106529907469e-07, "1": 7.28056700117388e-08}, "score": 4.903897668381999}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9864877492450222, "4": 0.0134933271624426, "3": 1.8736782265106704e-05, "2": 8.253750837142578e-08, "1": 1.672584013343988e-08}, "score": 4.986468883572533}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.965636582640942, "4": 0.03430247053996034, "3": 6.080223559582294e-05, "2": 5.940918457832024e-08, "1": 0}, "score": 4.965575743829232}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7924445057283958, "5": 0.16309687982167365, "3": 0.04241040694692242, "2": 0.0018873774615154023, "1": 0.00016003148193369075}, "score": 4.1164317164835795}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6155840420187595, "4": 0.3824195020578671, "3": 0.0019429652372951957, "2": 4.579493786123363e-05, "1": 6.9616154894379645e-06}, "score": 4.61352905247103}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9745840367409188, "4": 0.02475826268061731, "1": 0.0005743827913660458, "3": 6.685676920043101e-05, "2": 9.883103263759028e-06}, "score": 4.972780664259259}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9820351538995824, "4": 0.01783090662696886, "3": 9.441505656694501e-05, "1": 3.49775545767989e-05, "2": 3.6896941113539576e-06}, "score": 4.9818292683838825}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6777692148938044, "5": 0.31244160227142664, "3": 0.009428134763930156, "2": 0.00031719240892501055, "1": 4.296705064804423e-05}, "score": 4.302250450120858}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7406946032519757, "4": 0.2587092331134757, "3": 0.0005950697097723478, "2": 1.0116337092491778e-06, "1": 6.990092182677301e-08}, "score": 4.740097309741932}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.6416126155390061, "4": 0.30536777778472274, "2": 0.04984667923194008, "5": 0.002998978644842613, "1": 0.00017370258549462243}, "score": 3.261171714975609}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt35", "scores": {"3": 0.7569197664495598, "4": 0.24128692342686955, "2": 0.0014981024575465853, "5": 0.00029387325177339976, "1": 1.1824701027341866e-06}, "score": 3.2403742390561234}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9669213837062837, "4": 0.03305923587947165, "3": 1.926666803371478e-05, "2": 3.0966991192677194e-08, "1": 0}, "score": 4.966902135143672}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5761634449179371, "5": 0.4220144769355787, "3": 0.0018190352515541272, "2": 2.937011471203664e-06, "1": 8.054611172975146e-08}, "score": 4.420189336669229}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "human", "scores": {"5": 0.92606934549151, "4": 0.07383716377054385, "3": 9.331795732324303e-05, "2": 6.590503465167069e-08, "1": 0}, "score": 4.925975994688347}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6784467871331218, "5": 0.31873335610945835, "3": 0.0028182659345422447, "2": 1.6061091192650365e-06, "1": 5.174572587496175e-08}, "score": 4.315911701543316}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9572366413102388, "4": 0.0424483388037466, "3": 0.0003138093255419503, "2": 9.346048661758766e-07, "1": 1.9318433504555999e-07}, "score": 4.956920462427484}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9856857383161743, "4": 0.014303271380679092, "3": 1.0903442422624122e-05, "2": 3.964079786152e-08, "1": 1.006935685181362e-08}, "score": 4.985674762002463}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6555546551011538, "4": 0.3432409501044687, "3": 0.001200822428325596, "2": 3.384095146627059e-06, "1": 1.286796312777146e-07}, "score": 4.6543467174369955}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "human", "scores": {"5": 0.771234709165939, "4": 0.22826633404190727, "3": 0.0004984521306268663, "2": 5.12443692634513e-07, "1": 2.5665786411622918e-08}, "score": 4.770735129371057}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8726946545655638, "3": 0.0663743694020003, "5": 0.06053884826097943, "2": 0.0003899867865716714, "1": 1.9068955590368798e-06}, "score": 3.993378783049203}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9841739609224305, "4": 0.015791065082703216, "3": 3.489063858933544e-05, "2": 7.576556008409572e-08, "1": 8.098597001191488e-09}, "score": 4.984138893957106}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9079327145909504, "4": 0.0919651479809432, "3": 0.00010182784140820784, "2": 1.7234561271140415e-07, "1": 2.628690317320899e-08}, "score": 4.907830563925205}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.700366856854933, "4": 0.2989038288415351, "3": 0.0007265974119841426, "2": 2.5851991819334207e-06, "1": 1.7180443720397717e-07}, "score": 4.699634545567482}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5037183633380461, "3": 0.49184518826648116, "5": 0.00322536873124633, "2": 0.0012089365380511807, "1": 2.0659817929734922e-06}, "score": 3.5089560715620034}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9988685200067556, "4": 0.001130865511566978, "3": 5.969437196146229e-07, "1": 0, "2": 0}, "score": 4.99886794058114}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9969549220831351, "4": 0.003039029676124188, "3": 6.060131854205721e-06, "2": 7.001418959035745e-09, "1": 0}, "score": 4.996948829113555}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9407502855257498, "4": 0.059157872712062715, "3": 9.151972821646012e-05, "2": 2.633373308040839e-07, "1": 1.9311443293106155e-08}, "score": 4.940658218236551}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.976524664421748, "4": 0.023445610197840177, "3": 2.9572313177105597e-05, "2": 6.979433436698101e-08, "1": 1.7914417524554092e-08}, "score": 4.976494962598879}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8986826950850247, "5": 0.08830011226223863, "3": 0.012981409285326444, "2": 3.462979913099708e-05, "1": 1.0600197690150605e-06}, "score": 4.0752462703585195}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8821981132508444, "5": 0.11150216179209538, "3": 0.006235166475788038, "2": 6.298550105774608e-05, "1": 1.4447706048081107e-06}, "score": 4.105136703481913}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8241401158674242, "5": 0.16905927261776274, "3": 0.006792515056705356, "2": 7.725376488443128e-06, "1": 3.0941915208376306e-07}, "score": 4.162250388555384}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.930330555468135, "4": 0.06963320096660118, "3": 3.598332216668364e-05, "2": 1.0722300633515778e-07, "1": 0}, "score": 4.930294500053705}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8959807191899096, "5": 0.09826877031664243, "3": 0.005735253655487953, "2": 1.4967535535085974e-05, "1": 2.1334612289232976e-07}, "score": 4.092502948577898}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9023469298268708, "5": 0.08612894027859357, "3": 0.011512755320156855, "2": 1.107149246106608e-05, "1": 1.6959611850904492e-07}, "score": 4.074593543142338}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9945880168344993, "4": 0.005407772545609264, "3": 4.179708711917253e-06, "1": 0, "2": 0}, "score": 4.994583867869548}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.59544848563451, "5": 0.4022617270092931, "3": 0.0022891545997294187, "2": 6.1440347451122e-07, "1": 0}, "score": 4.399971350943287}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9765061409010755, "4": 0.02346100260227804, "3": 3.279442587012875e-05, "2": 2.5228134923363032e-08, "1": 6.924659193632063e-09}, "score": 4.976473304459069}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8465048821257523, "5": 0.1404708619461346, "3": 0.013003720111944471, "2": 2.035155980741568e-05, "1": 1.443371434389585e-07}, "score": 4.127426010789892}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8238985710790014, "4": 0.17278485001155042, "3": 0.0032909500068676167, "2": 2.376242515180078e-05, "1": 1.5275628516562934e-06}, "score": 4.820555791631594}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9966730091401436, "4": 0.0033211837778919524, "3": 5.790013122351422e-06, "2": 1.6546272286168535e-08, "1": 0}, "score": 4.996667186555304}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9863870655518113, "4": 0.013501682117547978, "3": 0.00011113331958788457, "2": 8.679524481657024e-08, "1": 0}, "score": 4.986275790415405}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8974571172356905, "4": 0.10205092761078306, "3": 0.0004910892867306135, "2": 7.86909963323042e-07, "1": 0}, "score": 4.896964524950511}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6522326340523019, "4": 0.34019615542845555, "3": 0.007557298454067813, "2": 1.3399797005036856e-05, "1": 4.543268336498983e-07}, "score": 4.644647210375444}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9286343712759136, "4": 0.06976923679230665, "3": 0.0015761572730200186, "2": 1.8309655762013488e-05, "1": 1.6733817150001938e-06}, "score": 4.927016807803383}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8290926076612518, "4": 0.1673094478632823, "3": 0.0035690922044291345, "2": 2.809359341408793e-05, "1": 7.389216080808145e-07}, "score": 4.8254651278130725}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7646012522016034, "4": 0.23376734742129354, "3": 0.0016247927659159762, "2": 6.223967455337945e-06, "1": 3.7078220323394376e-07}, "score": 4.762962908967036}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9897713798166009, "4": 0.010136444331062765, "3": 9.160799577258726e-05, "2": 4.949678628602453e-07, "1": 6.115201644307479e-08}, "score": 4.9896786100445985}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9339422065717023, "4": 0.06570460924607177, "3": 0.0003489069465884446, "2": 3.899976618901914e-06, "1": 3.070276586791363e-07}, "score": 4.933584644155821}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9008453308348678, "3": 0.07236780940078855, "5": 0.026739163246517213, "2": 4.7359790071985765e-05, "1": 2.1991713953882847e-07}, "score": 3.954275969173114}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7867795375393092, "5": 0.11207455046142309, "3": 0.10078675810301987, "2": 0.00035631706195959553, "1": 2.711599163172172e-06}, "score": 4.010567024760356}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8579715744968802, "3": 0.07839753448622916, "5": 0.06348510293849584, "2": 0.00014459873450098533, "1": 8.299353755252749e-07}, "score": 3.984795875712646}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.6871884608489505, "5": 0.3066721246480987, "3": 0.006125511596991643, "2": 1.329652280701958e-05, "1": 4.2134283488958576e-07}, "score": 4.300518811585085}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6844024891427556, "5": 0.31026763973337257, "3": 0.005321867518051558, "2": 7.73715893815774e-06, "1": 1.8503700589628176e-07}, "score": 4.304929767610722}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7479977417971383, "4": 0.2513817195671127, "3": 0.0006181873445037411, "2": 2.131177316907361e-06, "1": 0}, "score": 4.747375456605748}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5383006531818121, "4": 0.4606279553972316, "3": 0.0010705411614462435, "2": 7.653045329852231e-07, "1": 4.802414171888269e-08}, "score": 4.537228457179171}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9338930264700277, "4": 0.06598799153165882, "3": 0.000118709408101406, "2": 1.6930788072719336e-07, "1": 0}, "score": 4.933774074888528}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9855515345116103, "4": 0.01442760346544372, "3": 2.045774537987339e-05, "2": 1.7330686978712578e-07, "1": 0}, "score": 4.985530957781263}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9479472895627552, "5": 0.05041964994636673, "3": 0.001632371032392838, "2": 7.148529355169915e-07, "1": 0}, "score": 4.048785847969214}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5571344977894094, "5": 0.4409869702015565, "3": 0.0018763657213184209, "2": 2.0505797498311752e-06, "1": 1.0178867363223114e-07}, "score": 4.439106204066766}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6247535793698589, "5": 0.3736798366227619, "3": 0.0015654508709940838, "2": 1.150724285914407e-06, "1": 3.9856513285875146e-08}, "score": 4.372111943357904}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7691879200146272, "5": 0.22768832063580702, "3": 0.003122323009115606, "2": 1.3578554198450578e-06, "1": 6.877001606568241e-08}, "score": 4.224563077787437}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9810017956404986, "4": 0.018993290381487237, "3": 4.971216396573924e-06, "2": 1.2136334896329278e-08, "1": 0}, "score": 4.980996732095062}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6938769983433184, "4": 0.3057955614941896, "3": 0.0003268966474073222, "2": 4.875870491938319e-07, "1": 2.896206403621133e-08}, "score": 4.693549058337844}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8127596309804864, "3": 0.13106607416504887, "5": 0.05608147695667407, "2": 9.224799589454527e-05, "1": 4.165805486167145e-07}, "score": 3.9248296455329696}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7454785931088632, "5": 0.25206363588404074, "3": 0.002455794364529606, "2": 1.8545063795220657e-06, "1": 9.562581709996341e-08}, "score": 4.249603852246391}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9623748088568723, "4": 0.0375906323219717, "3": 3.445205192048978e-05, "2": 2.995669494410297e-08, "1": 0}, "score": 4.962340370811371}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.998083789180683, "4": 0.0019143445241147515, "3": 1.8382601579587407e-06, "2": 7.71406925012598e-09, "1": 0}, "score": 4.998081955774385}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5517562534845774, "5": 0.4438664278439943, "3": 0.004362491237725092, "2": 1.4440215511382324e-05, "1": 2.973892351833427e-07}, "score": 4.43947420348505}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.691440967697062, "4": 0.30717990292949343, "3": 0.0013779147132457238, "2": 1.0581335539795177e-06, "1": 7.568347471527246e-08}, "score": 4.690060765452984}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8464324498020499, "5": 0.15171471449520182, "3": 0.0018515108453978025, "2": 1.3274337379385335e-06, "1": 1.8998800335694565e-08}, "score": 4.149860488552659}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5894683617973119, "4": 0.4092843222617771, "3": 0.0012468224551588465, "2": 4.776135042678809e-07, "1": 4.599629441029893e-08}, "score": 4.588220428406682}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5376382461024642, "4": 0.46146373908022353, "3": 0.0008968786404376218, "2": 1.0908056568761747e-06, "1": 3.2176161006407716e-08}, "score": 4.536739096404532}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8631429055572604, "4": 0.1366633604600842, "3": 0.00019332719376192494, "2": 3.5178065316538893e-07, "1": 5.043774668619128e-08}, "score": 4.8629487274330545}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9033235356312392, "5": 0.06902030101842996, "3": 0.02762424913906365, "2": 3.139317642409973e-05, "1": 3.3396721749481027e-07}, "score": 4.041332271356795}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.731786744585399, "4": 0.2665320979605936, "3": 0.001679395620491265, "2": 1.6589096645277005e-06, "1": 1.0349598678675053e-07}, "score": 4.7301037202399}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5558777739072619, "5": 0.44277714243376176, "3": 0.0013450253749129702, "2": 1.416277075557318e-07, "1": 0}, "score": 4.4414317970129}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7563831870772999, "5": 0.23882961243022438, "3": 0.004776744650256466, "2": 9.779042329804835e-06, "1": 4.187693692296843e-07}, "score": 4.234032113774628}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8672245406301735, "5": 0.11598103414420555, "3": 0.016771963934764742, "2": 2.189277246589954e-05, "1": 4.4308509380885523e-07}, "score": 4.09916396784769}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5036566666544113, "5": 0.4934122734218363, "3": 0.002929032837603, "2": 1.8954050416007186e-06, "1": 6.347834581452822e-08}, "score": 4.490479292791155}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7257146394746302, "5": 0.2673648430390115, "3": 0.006917021645842509, "2": 3.3427056635677383e-06, "1": 1.1158602710392326e-07}, "score": 4.260440812044771}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5739567522576371, "4": 0.4247699503091968, "3": 0.0012725684744814094, "2": 5.718906701138816e-07, "1": 3.723777998635244e-08}, "score": 4.572682996913214}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9866695569452788, "4": 0.013312449885354388, "3": 1.77955523476148e-05, "2": 8.981606321161896e-08, "1": 3.382008432946273e-08}, "score": 4.986651553293894}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8947867296472464, "4": 0.1050305729767059, "3": 0.00018169556340570783, "2": 6.736123768524288e-07, "1": 1.4277698064500346e-07}, "score": 4.89460342440845}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6571142099926063, "4": 0.3414894478032287, "3": 0.0013949585184905436, "2": 1.1809209001536814e-06, "1": 1.3196831249953437e-07}, "score": 4.655716540149788}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9205508942953554, "4": 0.07932583620991647, "3": 0.00012305071136975928, "2": 1.7487437114376958e-07, "1": 2.598659522877269e-08}, "score": 4.920427432371719}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8135434520852248, "4": 0.1859428891496915, "3": 0.0005128979297187449, "2": 5.993884209409128e-07, "1": 5.680014263743559e-08}, "score": 4.8130292700591495}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6243662335738797, "4": 0.37503564657352756, "3": 0.0005978336619385216, "2": 2.6865575448326483e-07, "1": 1.802925717445568e-08}, "score": 4.623767808204297}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7348688875260313, "4": 0.26423785910966396, "3": 0.0008899655534285263, "2": 2.9844890449284904e-06, "1": 2.449499335847134e-07}, "score": 4.733972260988066}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8534498726411981, "3": 0.14059547269743436, "5": 0.005876705283783366, "2": 7.736175661947961e-05, "1": 4.013640364056701e-07}, "score": 3.86512527985965}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5448101683220866, "4": 0.4478384429593095, "3": 0.007345253181785481, "2": 5.04697754395919e-06, "1": 7.911873857124712e-07}, "score": 4.537452607446354}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8130464475568561, "5": 0.18375472994926512, "3": 0.0031978335950255737, "2": 7.919583776382707e-07, "1": 3.750550930353612e-08}, "score": 4.180555228707774}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9469625618489164, "4": 0.05298335348255099, "3": 5.372011744866061e-05, "2": 1.819166903493926e-07, "1": 3.654578422808301e-08}, "score": 4.946908506593282}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.634852474946178, "4": 0.36473482364426285, "3": 0.0004121415498596822, "2": 5.0981037198875e-07, "1": 1.9949874187926988e-08}, "score": 4.634439273022227}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9495493455911445, "3": 0.03914155846896264, "5": 0.011279714990850582, "2": 2.9146491867755163e-05, "1": 2.2667263429927945e-07}, "score": 3.9720791833028994}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9651798258236512, "4": 0.03479987792883355, "3": 2.0216084662326623e-05, "2": 3.97397059180439e-08, "1": 9.467196629735336e-09}, "score": 4.965159531735417}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9711671018146134, "4": 0.028807235233676606, "3": 2.5565954344749507e-05, "2": 2.4608350509575418e-08, "1": 7.37743367001793e-09}, "score": 4.971141527646712}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9293068530726999, "4": 0.07054770721046506, "3": 0.0001447271952053335, "2": 5.380491091513577e-07, "1": 7.60814013083068e-08}, "score": 4.929160912956254}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9720115284954572, "4": 0.027961740888992833, "3": 2.6565796910453063e-05, "2": 8.371413472940497e-08, "1": 3.610559490854822e-08}, "score": 4.971984730691745}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9165067470250636, "5": 0.06355383099504874, "3": 0.019917058567558318, "2": 2.1857094457332758e-05, "1": 3.171306509092728e-07}, "score": 4.043592115093694}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8893526059421926, "3": 0.07625044709277523, "5": 0.034098451714170364, "2": 0.00029702893490037144, "1": 1.3852152711081897e-06}, "score": 3.9572497876387094}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8300153370406395, "4": 0.16949007643190123, "3": 0.0004941675145390427, "2": 3.8860711144626295e-07, "1": 2.4822632478552272e-08}, "score": 4.8295203224753385}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9635139141270219, "4": 0.036451207263218766, "3": 3.4769047730350866e-05, "2": 7.452479113520694e-08, "1": 1.1114391909763362e-08}, "score": 4.9634789857356925}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7033222286176933, "4": 0.2963039184164049, "3": 0.00037296573716727585, "2": 7.479737149728508e-07, "1": 2.7437833260945083e-08}, "score": 4.702947763221236}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "human", "scores": {"4": 0.880467977718206, "3": 0.06611386474731985, "5": 0.053374439962193085, "2": 4.3218323394113374e-05, "1": 3.3156532099154213e-07}, "score": 3.9871731417212692}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9675722498682212, "5": 0.025332832431504616, "3": 0.0070879012342234, "2": 6.884383309140682e-06, "1": 1.2632915436300732e-07}, "score": 4.018230783548092}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.977869993270221, "4": 0.022085853246906637, "3": 4.409350787796743e-05, "2": 6.992077650780311e-08, "1": 0}, "score": 4.9778257501955485}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9646995406153999, "4": 0.03523266654084881, "3": 6.768093687814e-05, "2": 7.49162510498404e-08, "1": 0}, "score": 4.964631745528348}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9271465975592811, "4": 0.07269832024538755, "3": 0.00015443782033697998, "2": 5.622810629816997e-07, "1": 4.294528385571659e-08}, "score": 4.9269909426314085}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5695314350435835, "4": 0.42164282904318934, "2": 0.005718546581621083, "5": 0.003092736442098247, "1": 1.4371708089147807e-05}, "score": 3.4220810461947244}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9591148280387012, "4": 0.0408473839548394, "3": 3.7528459230623476e-05, "2": 1.6744263867571435e-07, "1": 3.4906492273845096e-08}, "score": 4.959076914832092}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8155931329067757, "5": 0.1805617056631953, "3": 0.00383940988489666, "2": 5.305455113711519e-06, "1": 1.2641875349258888e-07}, "score": 4.176711362101356}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6119771706653343, "4": 0.3874702140929681, "3": 0.0005510731494502029, "2": 1.3373226033261026e-06, "1": 1.25330824463931e-07}, "score": 4.611423095448933}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7574892750868732, "4": 0.24215336836210863, "3": 0.00035615141304214267, "2": 1.0003746281198664e-06, "1": 0}, "score": 4.75713127795731}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5235002872296328, "5": 0.47263109064940717, "3": 0.0038633743246710046, "2": 4.818990941763506e-06, "1": 1.7308751557191795e-07}, "score": 4.468757678950003}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.844577362052335, "5": 0.12553426873931223, "3": 0.0298554164497974, "2": 3.244364414824893e-05, "1": 3.450429275411577e-07}, "score": 4.095612945559793}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7307430177103718, "4": 0.2684881768717364, "3": 0.0007679845056154519, "2": 6.981949326751258e-07, "1": 0}, "score": 4.729973726395327}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9012076786388643, "5": 0.08991382206411777, "3": 0.008830006749356729, "2": 4.721683760811185e-05, "1": 1.0311643059612346e-06}, "score": 4.080986307951484}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6669214740881552, "5": 0.33085230885274425, "3": 0.0022211117947826494, "2": 5.016415114418495e-06, "1": 9.692096348632341e-08}, "score": 4.328620870812293}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6438555109046449, "5": 0.3496617920864421, "3": 0.006468189756228195, "2": 1.3872237739347877e-05, "1": 5.573808937137247e-07}, "score": 4.343164212353283}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5289081984949482, "5": 0.4673014389477765, "3": 0.0037759257294494087, "2": 1.339311217433532e-05, "1": 1.0756698222067552e-06}, "score": 4.463495485173898}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6215591373148521, "4": 0.3757928944418179, "3": 0.002635490411196127, "2": 1.2003071291082765e-05, "1": 5.144327498159138e-07}, "score": 4.618898072909958}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9606974287537239, "4": 0.03920106751621557, "3": 0.00010100323620527007, "2": 3.2280868361453575e-07, "1": 6.364392247534178e-08}, "score": 4.9605956985159185}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.593728520670788, "4": 0.4025099346773204, "3": 0.003750727716849758, "2": 1.0059651862548348e-05, "1": 6.712951035568018e-07}, "score": 4.58995571049406}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8350944639925979, "4": 0.16371754869739238, "3": 0.0011817427775098759, "2": 5.660337718215378e-06, "1": 3.8783726709720825e-07}, "score": 4.83390040077046}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6712519017607148, "4": 0.32473675807933816, "3": 0.00396551161274939, "2": 4.401892072497043e-05, "1": 1.6837636539576288e-06}, "score": 4.667193384990394}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9303082743181494, "4": 0.06900629821998527, "3": 0.0006764723387196299, "2": 7.400781168609192e-06, "1": 1.340108469351861e-06}, "score": 4.929613179245978}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9820338860930171, "4": 0.017843952922524525, "3": 0.00011816956186348074, "2": 2.6321093473985416e-06, "1": 0}, "score": 4.981911787038159}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8260546214368313, "4": 0.17152401380358406, "3": 0.0023686620952661887, "2": 4.321292144131817e-05, "1": 9.414598890520834e-06}, "score": 4.823571351588446}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6329960860705295, "3": 0.3653410419999752, "5": 0.0009404923906551919, "2": 0.0007217264997848652, "1": 6.63361331828543e-07}, "score": 3.6341540110834782}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8308319672901319, "4": 0.16865374701869518, "3": 0.0005134381416600275, "2": 7.839924082480232e-07, "1": 2.6956806801445593e-08}, "score": 4.83031691068308}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8926748447797505, "4": 0.10721844323938363, "3": 0.00010657943311268066, "2": 1.0469756251499429e-07, "1": 0}, "score": 4.892568080809704}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.82522514239923, "4": 0.17425113774147138, "3": 0.0005215672170889722, "2": 1.8856310849840802e-06, "1": 1.4014040836911883e-07}, "score": 4.824699488128962}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7242029776634834, "4": 0.2746882941509046, "3": 0.001105471100028376, "2": 3.056650039557882e-06, "1": 1.3514764357541054e-07}, "score": 4.72309103502954}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7759003205105711, "4": 0.17079316773146003, "2": 0.05256223410007155, "5": 0.0006971078671468685, "1": 4.699167968050009e-05}, "score": 3.119531187296149}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.5028268010936404, "4": 0.45951835150359993, "2": 0.02607968031132909, "5": 0.011450402462915657, "1": 0.0001246596293344589}, "score": 3.4560902047485307}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9982807219547003, "4": 0.0017153308526040986, "3": 3.89391686793695e-06, "2": 3.324960332469744e-08, "1": 0}, "score": 4.998276781530341}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9301119813776993, "4": 0.06984626265553719, "3": 4.149477675392628e-05, "2": 1.2261591616131476e-07, "1": 0}, "score": 4.93007037025277}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.798851138768322, "4": 0.2008885303761146, "3": 0.00025992355224783704, "2": 3.6452416186469257e-07, "1": 1.4795984656203868e-08}, "score": 4.798590464126888}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9629687320748377, "4": 0.03675428725968764, "3": 0.0002756634004794792, "2": 1.116781131754488e-06, "1": 1.0987637135195785e-07}, "score": 4.9626905927099605}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8265858957655952, "4": 0.1729303442424625, "3": 0.0004810200041759072, "2": 2.6724149999429322e-06, "1": 6.07558781339535e-08}, "score": 4.826099354295212}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9789039799362618, "4": 0.02103434922796746, "3": 6.13753051480271e-05, "2": 2.5240068306583315e-07, "1": 2.1025013268616768e-08}, "score": 4.9788420583919395}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9945606538070154, "4": 0.00543275992870972, "3": 6.563667769817954e-06, "2": 3.537027708008079e-08, "1": 1.0414570517517157e-08}, "score": 4.994553965092922}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6976533031321513, "3": 0.2396276544885154, "5": 0.05189047664310228, "2": 0.010764621597155771, "1": 6.386660159267365e-05}, "score": 3.790541962914648}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6073716693201628, "3": 0.3916358597981619, "5": 0.0009367644450684777, "2": 5.559156927219806e-05, "1": 9.049719329829155e-08}, "score": 3.609189440492674}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8012791746423719, "4": 0.1984061870281308, "3": 0.0003134235773553018, "2": 1.0852382606610642e-06, "1": 7.794651114853135e-08}, "score": 4.800963388052537}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9498559855851456, "4": 0.050073152137915654, "3": 7.071654467939389e-05, "2": 3.338871060296092e-08, "1": 5.7370425189387094e-09}, "score": 4.949785286305208}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9830805884980065, "4": 0.01690374641939235, "3": 1.5602287809599365e-05, "2": 4.974952107606017e-08, "1": 0}, "score": 4.983064899535503}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9951064466379335, "4": 0.004889601850382081, "3": 3.947014845814147e-06, "2": 9.045603485338295e-09, "1": 2.9613784039328135e-09}, "score": 4.995102465174383}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6138378154165238, "5": 0.37206866812874945, "3": 0.014072461168764266, "2": 2.05783706956501e-05, "1": 4.212059207180046e-07}, "score": 4.357953806542204}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9160714730544157, "4": 0.08326171827227662, "3": 0.0006659437835970265, "2": 7.874491813089931e-07, "1": 5.056359429192322e-08}, "score": 4.915403827284923}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.58023557158285, "4": 0.4179232147926424, "3": 0.0018389559258771106, "2": 2.0845907603253003e-06, "1": 8.743064381534863e-08}, "score": 4.578392233738563}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9946619506912333, "4": 0.005322786683939617, "3": 1.516194329923194e-05, "2": 6.571898422489714e-08, "1": 2.0509554217166714e-08}, "score": 4.994646610156922}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8587178536780854, "4": 0.14100293122362753, "3": 0.00027887106934357963, "2": 2.5538005234010483e-07, "1": 9.725680262663542e-09}, "score": 4.85843851042232}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6548263061264818, "5": 0.254270224879968, "3": 0.09043177318960063, "2": 0.0004598431982321728, "1": 1.1851750260285256e-05}, "score": 4.162883210182461}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9549157569597112, "4": 0.04415607775110271, "3": 0.0009271337687040062, "2": 9.410467663788044e-07, "1": 4.217374356280962e-08}, "score": 4.953986660653772}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9914864096247387, "4": 0.008455700920071675, "3": 5.7708273875936155e-05, "2": 6.112853857679944e-08, "1": 0}, "score": 4.991428698117552}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9827358924106941, "4": 0.017230236542684494, "3": 3.385003583383175e-05, "2": 6.417616223191635e-08, "1": 0}, "score": 4.982701871603842}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8248185468917628, "4": 0.17286398631124378, "3": 0.002314824509844632, "2": 2.495071928794982e-06, "1": 1.1818933080092677e-07}, "score": 4.822498401543815}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9476949767351376, "4": 0.05226174650035707, "3": 4.3061251601357587e-05, "2": 1.0754623379751804e-07, "1": 3.654666133742974e-08}, "score": 4.947651658432375}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8729673007758418, "5": 0.12612704328044327, "3": 0.0009043763209116691, "2": 1.3423147619620932e-06, "1": 2.3985820348816045e-08}, "score": 4.125219899518765}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9996180205027515, "4": 0.0003811422091944803, "3": 7.870646063240119e-07, "1": 1.130523436883167e-08, "2": 0}, "score": 4.999617238425758}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9999318626214566, "4": 6.803760438348174e-05, "3": 4.3779113238587904e-08, "1": 1.7403841016613656e-09, "2": 0}, "score": 4.999931867872157}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9982144363189748, "4": 0.0017829250087773934, "3": 2.567217321343876e-06, "2": 1.3331515743905237e-08, "1": 0}, "score": 4.998211900458101}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "human", "scores": {"4": 0.87635535842599, "5": 0.10983884861069751, "3": 0.013792854648597449, "2": 1.2794617286194341e-05, "1": 1.6570180821341837e-07}, "score": 4.096019905509243}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9032844496674834, "4": 0.09664592854289068, "3": 6.942184295403939e-05, "2": 1.3078317992994056e-07, "1": 0}, "score": 4.903214828727662}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9203499047469146, "4": 0.07953513541893656, "3": 0.00011479794212269199, "2": 7.70498671027556e-08, "1": 0}, "score": 4.920235030779785}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9608200071545877, "4": 0.039134568410850855, "3": 4.5040251059642804e-05, "2": 2.8000902560306886e-07, "1": 0}, "score": 4.9607745069736575}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9361158863176143, "4": 0.06380563306334693, "3": 7.8154571994446e-05, "2": 2.4841353491148675e-07, "1": 0}, "score": 4.936037307586411}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9454458413101443, "3": 0.030848298010209326, "5": 0.02367094103035473, "2": 3.433181783860942e-05, "1": 2.6332179435989604e-07}, "score": 3.992753187067425}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8888046081348356, "4": 0.11105189104676179, "3": 0.00014296281449739355, "2": 3.7108970912400507e-07, "1": 5.2509275855159986e-08}, "score": 4.888660847280266}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6862443220996888, "4": 0.31335965205294564, "3": 0.0003954934627382498, "2": 5.452524164795674e-07, "1": 3.365110309387354e-08}, "score": 4.685847605273938}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9961218394639774, "4": 0.003876233671523589, "3": 1.9359778699232298e-06, "2": 6.13935591577887e-09, "1": 3.632037686580675e-09}, "score": 4.996119861499793}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7515749807368585, "4": 0.24763992579000613, "3": 0.0007818276016277462, "2": 2.994722455419325e-06, "1": 1.665382207192502e-07}, "score": 4.750786742616083}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6827811468289197, "4": 0.3161286272365329, "3": 0.0010871203058634643, "2": 2.7623107507028155e-06, "1": 1.4265217675388442e-07}, "score": 4.681688210736506}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.611262052864335, "4": 0.38793606649920503, "3": 0.0007999934642637752, "2": 1.7880033636119221e-06, "1": 6.509930263508106e-08}, "score": 4.610458308893464}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6076901309354087, "4": 0.39173211222039944, "3": 0.0005775673494176271, "2": 1.6760681289384407e-07, "1": 0}, "score": 4.607112241660814}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9653134420192317, "4": 0.0346707252792042, "3": 1.5818664779133827e-05, "2": 2.163263030262378e-08, "1": 0}, "score": 4.965297572756941}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8280214161631735, "5": 0.16191098015485839, "3": 0.010055230822791222, "2": 1.2148729032839505e-05, "1": 1.6496788802775178e-07}, "score": 4.151830965953}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5582703699438184, "5": 0.43945361843366515, "3": 0.0022755261012896905, "2": 4.814781431446051e-07, "1": 1.608547734965139e-08}, "score": 4.437177075854998}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9939239649156737, "4": 0.006068907946885503, "3": 7.105780146357922e-06, "2": 1.3653034941400244e-08, "1": 7.3024640839590394e-09}, "score": 4.993916810321417}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9934669934881196, "4": 0.006524049544901391, "3": 8.950295584694624e-06, "2": 1.440463222213988e-08, "1": 5.154029505271936e-09}, "score": 4.993457986118224}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9967704741736069, "4": 0.003225419047391003, "3": 4.1047077962211965e-06, "2": 2.0396877735322412e-08, "1": 0}, "score": 4.996766310405643}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9435978310894078, "4": 0.05634498724224395, "3": 5.7008111114446386e-05, "2": 7.216526507168855e-08, "1": 1.3753974500778367e-08}, "score": 4.943540720075856}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "human", "scores": {"4": 0.760507488895434, "3": 0.22473397716160992, "5": 0.014222152425397776, "2": 0.0005320380758697416, "1": 4.100953706345687e-06}, "score": 3.78841174494332}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8500839497184565, "5": 0.07537098442355261, "3": 0.07442244518842703, "2": 0.00012155496629437416, "1": 9.417744767530381e-07}, "score": 4.00070260406618}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9369265015516274, "5": 0.052964748995947, "3": 0.010099115835565315, "2": 9.46716558701758e-06, "1": 6.214273005544037e-08}, "score": 4.042846516870275}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.730886520497972, "5": 0.26392611036288666, "3": 0.005180631080080823, "2": 6.3855367998069965e-06, "1": 1.9316443808376155e-07}, "score": 4.258732169946887}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9419046785733747, "3": 0.04188580886480914, "5": 0.016182578769232334, "2": 2.6874383804068788e-05, "1": 1.0705437007473943e-07}, "score": 3.974242701200926}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9062198611756791, "5": 0.08051416075725192, "3": 0.013244158389878398, "2": 2.1045643055409383e-05, "1": 4.303121333839918e-07}, "score": 4.0672266432521385}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7689426112689254, "5": 0.2252184857864501, "3": 0.005829906013110662, "2": 8.810617761380452e-06, "1": 1.8501017747553432e-07}, "score": 4.21937040379325}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5875874282458757, "5": 0.40874945095538173, "3": 0.003654664434432426, "2": 8.235882792660348e-06, "1": 1.4995148927351694e-07}, "score": 4.405077893471052}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9861048335228502, "4": 0.013886199135708413, "3": 8.850735456215658e-06, "2": 2.1932462318374594e-08, "1": 0}, "score": 4.986096032279654}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6471727749641785, "4": 0.3518523329736409, "3": 0.0009721426548730227, "2": 2.329797975359797e-06, "1": 8.937793475962657e-08}, "score": 4.646195917973732}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6169764835405211, "4": 0.3826979665482712, "3": 0.00032540662624602144, "2": 9.881652392225516e-08, "1": 9.685712261936549e-09}, "score": 4.6166508716728885}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8526228539517604, "5": 0.1390247366741799, "3": 0.008310728570590292, "2": 4.1316319118574856e-05, "1": 2.6445096245018447e-07}, "score": 4.130630595179886}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8135825112439671, "4": 0.1858107121623148, "3": 0.0006059830758046772, "2": 7.035900258955001e-07, "1": 2.3045622471692136e-08}, "score": 4.812975106224859}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8978027191119969, "4": 0.10215879117421416, "3": 3.80146099408776e-05, "2": 8.525423880210983e-08, "1": 0}, "score": 4.897764883986868}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9313365723610827, "3": 0.063834403127017, "5": 0.00371750066777445, "2": 0.0011072458092449109, "1": 4.111580719961916e-06}, "score": 3.937656260802733}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7778412923672489, "3": 0.22000533124314536, "5": 0.0016989463741070093, "2": 0.00045385558737794795, "1": 4.921447285461884e-07}, "score": 3.780784409484218}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8653176621382335, "5": 0.13120480233223397, "3": 0.0034755980988446194, "2": 1.9224272070049523e-06, "1": 4.5288486405335525e-08}, "score": 4.127725219645357}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6607048759485106, "5": 0.33723110909744547, "3": 0.00206170287357421, "2": 2.1824248124954087e-06, "1": 7.368180112956702e-08}, "score": 4.335164839089312}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8494994205308903, "3": 0.10558139573318577, "5": 0.04476118147989218, "2": 0.000156809949283159, "1": 1.1518848007958466e-06}, "score": 3.93886270772245}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9244199862819756, "3": 0.04968451320360114, "5": 0.025848259785594012, "2": 4.695828047107325e-05, "1": 2.1269321811336645e-07}, "score": 3.976069190272099}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9505170464708531, "4": 0.04934385201960245, "3": 0.0001385655581895622, "2": 3.5882752344172647e-07, "1": 1.5414363105656194e-07}, "score": 4.950377322666585}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9944229451354741, "4": 0.005572064764092207, "3": 4.9654084400183425e-06, "2": 1.3994618137345782e-08, "1": 0}, "score": 4.994417962375461}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9071646979139237, "4": 0.0925995682377649, "3": 0.00023536336593358754, "2": 2.822338088873865e-07, "1": 3.2608005866378566e-08}, "score": 4.90692872271838}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9463712424810424, "4": 0.05360733892690651, "3": 2.126451153279602e-05, "2": 3.073010635069148e-08, "1": 0}, "score": 4.946350033241963}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5865071206743935, "4": 0.41319801736234185, "3": 0.00029443685268105, "2": 3.1875884239866147e-07, "1": 2.4823799169695845e-08}, "score": 4.586212019625289}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9060877258297447, "5": 0.0596197311580606, "3": 0.03427168760243793, "2": 2.0428144001133654e-05, "1": 3.521216938258207e-07}, "score": 4.025306132804144}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8618555480753073, "5": 0.08629324995503942, "3": 0.05107832704592975, "2": 0.0007611916440050469, "1": 1.1645496723736422e-05}, "score": 4.033657604402614}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8725243648202876, "4": 0.12694422020362817, "3": 0.0005299057486330811, "2": 1.4147029192103218e-06, "1": 8.713606277759498e-08}, "score": 4.8719913747003085}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6157123615729952, "4": 0.3825641987231442, "3": 0.0017212939060697004, "2": 2.0974483992088185e-06, "1": 5.561254675980216e-08}, "score": 4.6139867014730065}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6061932193020062, "4": 0.3931864862270589, "3": 0.0006197952973539065, "2": 5.271213759646628e-07, "1": 6.053428125930012e-08}, "score": 4.605572134576777}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8288224421167066, "5": 0.1593916337321516, "3": 0.01177222541960587, "2": 1.3495651979364575e-05, "1": 2.7582589099894806e-07}, "score": 4.147591578794167}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.823029602447442, "5": 0.1746118968769762, "3": 0.002356564360665444, "2": 1.8263666534016065e-06, "1": 2.462427726410463e-08}, "score": 4.172251620607367}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8420347877295383, "4": 0.15775984036712434, "3": 0.00020508562153492854, "2": 1.8590463681634044e-07, "1": 1.3965902692549183e-08}, "score": 4.84182936114456}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9170647211413177, "5": 0.07325963528562926, "3": 0.009659040140810515, "2": 1.619835279850881e-05, "1": 2.7989928357587515e-07}, "score": 4.063567366698745}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8966281153608395, "5": 0.09068161895557772, "3": 0.012666722500491966, "2": 2.30609464738477e-05, "1": 4.982514338925728e-07}, "score": 4.077967278559205}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "human", "scores": {"4": 0.905311984894053, "5": 0.0761622001798657, "3": 0.018490973220563405, "2": 3.424660918687879e-05, "1": 4.837319045098755e-07}, "score": 4.057601288959949}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9205550220548199, "4": 0.0789622412211488, "3": 0.00047933539847421576, "2": 2.940114593477449e-06, "1": 3.4443101957375085e-07}, "score": 4.920068880579692}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6891888518172724, "4": 0.3084866223839783, "3": 0.0023192595586482975, "2": 4.6822724483356445e-06, "1": 5.165049317652848e-07}, "score": 4.6868587245362905}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9873363840227973, "4": 0.012593648240835418, "3": 6.891911412900259e-05, "2": 7.494932690733405e-07, "1": 1.9458281119522978e-07}, "score": 4.98726548538851}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7009043143863074, "4": 0.296080471035301, "3": 0.0030034609657886837, "2": 1.068408827922844e-05, "1": 1.0268763843874733e-06}, "score": 4.6978764343777994}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9559669238619884, "3": 0.033891673982419546, "5": 0.010116752154325469, "2": 2.4569345744775235e-05, "1": 8.698631756741524e-08}, "score": 3.9761756786722895}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8667545542779035, "5": 0.1283684672566268, "3": 0.004873419657052653, "2": 3.3966259048656115e-06, "1": 7.006096817823522e-08}, "score": 4.12348805554077}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7401464847566916, "5": 0.25782345789656647, "3": 0.002027587330309447, "2": 2.3979076820358368e-06, "1": 3.357110869959937e-08}, "score": 4.255790983895149}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6046646331610691, "4": 0.3947888318276922, "3": 0.0005455694207599169, "2": 8.887063241912036e-07, "1": 7.310105777859178e-08}, "score": 4.604117069309921}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9668906186911401, "5": 0.028710487639160745, "3": 0.004390250464963983, "2": 8.646923197565852e-06, "1": 3.880665827553818e-08}, "score": 4.024302825874345}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8675339608270046, "5": 0.1164129844090616, "3": 0.01603814550697556, "2": 1.4562075169117935e-05, "1": 2.0386557630086894e-07}, "score": 4.100345117536101}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9773870164474171, "4": 0.022586881631917917, "3": 2.6099301668232307e-05, "2": 2.21803294868838e-08, "1": 5.402251639534329e-09}, "score": 4.977360832179906}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6291719557955112, "4": 0.37039636128609876, "3": 0.0004313482454622896, "2": 3.2652934982615265e-07, "1": 2.2675200469318795e-08}, "score": 4.628739877329137}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9788401281122004, "4": 0.021131095562994424, "3": 2.8594619134207526e-05, "2": 1.216164009835385e-07, "1": 2.982499609180473e-08}, "score": 4.9788112304082865}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8314981377324075, "5": 0.161200040124234, "3": 0.007274127531921697, "2": 2.7008633062805377e-05, "1": 6.59356155517717e-07}, "score": 4.153869921354079}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7991404791174526, "5": 0.19466917492817906, "3": 0.006179786222125057, "2": 1.060946532611271e-05, "1": 1.0544914902421428e-07}, "score": 4.188467824181098}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7602901060886875, "4": 0.23876907679668902, "3": 0.0009310069645458396, "2": 8.38495105429098e-06, "1": 1.1736394454969423e-06}, "score": 4.759338999322695}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9938411797650232, "4": 0.0061439648756926885, "3": 1.4441825685177377e-05, "2": 2.0223569758956172e-07, "1": 0}, "score": 4.993826543461405}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9852788110101378, "4": 0.01470026732483313, "3": 2.0713435712705478e-05, "2": 1.7032831460558019e-07, "1": 0}, "score": 4.985257794260055}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9094995734663918, "4": 0.0900073180761759, "3": 0.0004897867331856289, "2": 2.8603859347960955e-06, "1": 2.3057238248702112e-07}, "score": 4.909003584011246}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8385669382140023, "4": 0.1612782249780761, "3": 0.00015476557581414478, "2": 5.3813202513775343e-08, "1": 0}, "score": 4.8384120796160035}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9385251830666723, "5": 0.05177630845882624, "3": 0.009695229680058107, "2": 3.048911244774261e-06, "1": 6.776249270604187e-08}, "score": 4.042074784489995}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8880991738166547, "4": 0.11186348892180019, "3": 3.723784407329206e-05, "2": 1.852010385542076e-08, "1": 0}, "score": 4.88806197077425}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9316636406751231, "4": 0.0683100485164009, "3": 2.6196886241610353e-05, "2": 2.0381565430633255e-08, "1": 0}, "score": 4.931637490171744}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5179184922356674, "5": 0.48146391184117654, "3": 0.0006171799027369463, "2": 3.6138932396377745e-07, "1": 0}, "score": 4.480846035428938}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7100177281735369, "5": 0.2713615539145457, "3": 0.0185863525769203, "2": 3.3489252215435444e-05, "1": 9.113844681598422e-07}, "score": 4.25270547975886}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9756326418200029, "4": 0.02427044800997778, "3": 9.666878597624492e-05, "2": 1.9245913335806576e-07, "1": 2.9992184676692485e-08}, "score": 4.975535516608752}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8918113195008547, "4": 0.10801001766522642, "3": 0.00017824358287841732, "2": 3.335523541344579e-07, "1": 4.434681259980641e-08}, "score": 4.891632312643496}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9714021381222296, "4": 0.028519061235046456, "3": 7.851451859675271e-05, "2": 1.6820455650006845e-07, "1": 3.5782639189550275e-08}, "score": 4.971323259628114}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9774914509422419, "4": 0.02245450088574196, "3": 5.371667947116034e-05, "2": 2.4038092123931015e-07, "1": 3.89352821986891e-08}, "score": 4.977437187694178}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8274802988918611, "5": 0.16085772505453635, "3": 0.011648425014477713, "2": 1.3325274336756288e-05, "1": 2.746357946887574e-07}, "score": 4.149181818293336}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.950546670746756, "5": 0.040343882768886286, "3": 0.009104907728599912, "2": 4.486027462776091e-06, "1": 3.300773199651091e-08}, "score": 4.031229904578036}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9145987175105327, "4": 0.08506087520016715, "3": 0.0003394745761247919, "2": 8.28939635919244e-07, "1": 1.4050904120914138e-07}, "score": 4.914257129942319}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9320084386425836, "5": 0.05953655412662762, "3": 0.008432713269294454, "2": 2.183994337086596e-05, "1": 3.7331248747681647e-07}, "score": 4.051059045153881}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7492014522598305, "4": 0.25050535035067045, "3": 0.0002926202103980278, "2": 5.016240009442443e-07, "1": 2.912482306792584e-08}, "score": 4.748907776198957}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7542554690435604, "5": 0.2293291663196011, "3": 0.016389749009172488, "2": 2.4669028697647103e-05, "1": 6.786379922105163e-07}, "score": 4.21288810038476}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9110566219784634, "4": 0.08886065592023373, "3": 8.254639987473179e-05, "2": 8.125154504328588e-08, "1": 0}, "score": 4.910973999116887}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7738547070524092, "4": 0.22568142456174137, "3": 0.0004631780595256277, "2": 5.945880643467793e-07, "1": 2.8017878855262746e-08}, "score": 4.773390308137404}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9725294501669834, "4": 0.027458502884330653, "3": 1.1884280470034325e-05, "2": 2.890830248118275e-08, "1": 8.441751720936906e-09}, "score": 4.972517604618772}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9943146192965048, "4": 0.005680903454538379, "3": 4.357827084274113e-06, "2": 4.073887665674698e-08, "1": 1.7520608855775882e-08}, "score": 4.994310188244225}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5740753037874833, "3": 0.42157233625553453, "5": 0.0034913423123313354, "2": 0.0008582758557083782, "1": 2.694321898285437e-06}, "score": 3.5801943514527523}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7509034330297605, "5": 0.2411742205056969, "3": 0.007904579530957972, "2": 1.705116547953475e-05, "1": 7.288360699338442e-07}, "score": 4.233233349087685}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8993222364221658, "4": 0.10049819619023007, "3": 0.00017928299910547404, "2": 2.1215854245496802e-07, "1": 2.692660515220835e-08}, "score": 4.899142489060329}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9796188025289266, "4": 0.020363978474083236, "3": 1.712310220676327e-05, "2": 6.003128463669545e-08, "1": 2.866634644347092e-08}, "score": 4.979601480415454}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9505849091567833, "4": 0.04933166559323923, "3": 8.313581185647309e-05, "2": 2.0189420790069985e-07, "1": 3.786237356191571e-08}, "score": 4.950501303191758}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "human", "scores": {"4": 0.92884113616117, "5": 0.06450947285468835, "3": 0.006647802035007499, "2": 1.4969348108520153e-06, "1": 2.82673050148255e-08}, "score": 4.057858595836457}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9600243358478947, "4": 0.03989931991374016, "3": 7.60991852090158e-05, "2": 9.717250848516546e-08, "1": 2.62539863102542e-08}, "score": 4.959948080310989}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6673104760733622, "5": 0.33124738369239703, "3": 0.001441595777718648, "2": 4.3323566328015284e-07, "1": 1.6373723707326628e-08}, "score": 4.329804903603232}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9969923594403148, "4": 0.0030048831408121582, "3": 2.694585954770024e-06, "2": 1.4015751957572143e-08, "1": 1.1402536571783709e-08}, "score": 4.996989639917245}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9861185168084545, "4": 0.013864055824462674, "3": 1.731549140857582e-05, "2": 5.4794829479926986e-08, "1": 1.1041808457021023e-08}, "score": 4.986101104001106}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8332022243097897, "4": 0.16637080777996652, "3": 0.00042459095980818646, "2": 1.6770563064268518e-06, "1": 5.191473929374916e-07}, "score": 4.832772872316169}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8966526564081996, "4": 0.10322471171465308, "3": 0.00012223819483975966, "2": 3.493599747654158e-07, "1": 5.6606614194762284e-08}, "score": 4.896529538660347}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.876557819897186, "5": 0.11352652147203221, "3": 0.009896382427343928, "2": 1.8828497713939388e-05, "1": 3.10865653628552e-07}, "score": 4.103591563627775}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9623981053458383, "4": 0.03758674565153393, "3": 1.5052010314131904e-05, "2": 3.932383552542262e-08, "1": 1.4458722084792145e-08}, "score": 4.96238297289602}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9532872711301483, "4": 0.046633318689480854, "3": 7.907715788913322e-05, "2": 2.6154669589366697e-07, "1": 6.472760920205258e-08}, "score": 4.953207483128454}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7156081058958322, "4": 0.2826615029191247, "3": 0.0017256308244771306, "2": 4.1832295087001175e-06, "1": 1.9857003060906549e-07}, "score": 4.713873783147038}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9998007707887756, "4": 0.00019911042253941132, "3": 4.8040136421045244e-08, "1": 0, "2": 0}, "score": 4.999800793483094}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9991214395604164, "4": 0.0008753561726269847, "3": 3.1638022816762192e-06, "2": 7.341578227957653e-09, "1": 0}, "score": 4.999118294168871}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9983552086543567, "4": 0.001642955212310531, "3": 1.7742619931567178e-06, "1": 0, "2": 0}, "score": 4.998353496161831}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.999954033236504, "4": 4.588368273825519e-05, "3": 3.464421778941494e-08, "1": 0, "2": 0}, "score": 4.999954047026599}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9313705993643384, "4": 0.06843237141552261, "3": 0.00019663251054712695, "2": 2.9516538812303287e-07, "1": 3.322583835530929e-08}, "score": 4.93117334046174}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9778110539326786, "4": 0.022150371735294796, "3": 3.8486308626856565e-05, "2": 5.710295330461415e-08, "1": 9.650269447158419e-09}, "score": 4.97777244526473}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9883627606239578, "4": 0.01161903590022569, "3": 1.8104953194048945e-05, "2": 1.657558512232221e-08, "1": 0}, "score": 4.9883447035115145}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9396953142851352, "4": 0.06024207201998152, "3": 6.228599230924354e-05, "2": 2.7131888782592977e-07, "1": 3.036825553318481e-08}, "score": 4.939632418995225}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9431779140600519, "4": 0.056806694459359944, "3": 1.5269854000162083e-05, "2": 4.011678546775515e-08, "1": 0}, "score": 4.943162640849482}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8388642880572128, "4": 0.16079841166359782, "3": 0.00033680783931199924, "2": 4.592946012425444e-07, "1": 0}, "score": 4.838526589421893}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8796874104601566, "4": 0.12005059500707527, "3": 0.000261787880115633, "2": 1.3750301401100355e-07, "1": 8.110024077158544e-09}, "score": 4.879425376923726}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7903474895826663, "4": 0.20914859474551628, "3": 0.000503173558831985, "2": 6.840854501545973e-07, "1": 0}, "score": 4.789842993685577}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9992149787405425, "4": 0.0007833213793616527, "3": 1.6166216296815006e-06, "2": 1.4378123311788448e-08, "1": 7.591793315463099e-09}, "score": 4.999213371827624}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9113468251457373, "4": 0.08853784422582753, "3": 0.000114978086492217, "2": 2.659996084921016e-07, "1": 2.0949270755306996e-08}, "score": 4.911231311982669}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6121913389439054, "5": 0.38588485003263434, "3": 0.0019204520076471165, "2": 3.142754227477629e-06, "1": 1.0959840669418293e-07}, "score": 4.383957824675475}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9062325936541741, "4": 0.09367697977669653, "3": 9.019559211449737e-05, "2": 1.2907386494276442e-07, "1": 0}, "score": 4.906142232253077}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9633274604317327, "3": 0.02898871971531955, "5": 0.007676132802371179, "2": 7.587245076260603e-06, "1": 5.3691829384331363e-08}, "score": 3.978672076537902}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8465117134477154, "4": 0.1533717141216926, "3": 0.00011634635460403712, "2": 1.596883074696123e-07, "1": 0}, "score": 4.846395103906705}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9231219497198645, "3": 0.06986957424270732, "5": 0.006737899833621552, "2": 0.0002682358304578883, "1": 2.090897831045809e-06}, "score": 3.936325565351293}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7314775861022116, "5": 0.2629758174213997, "3": 0.005502762720733216, "2": 4.208917399950681e-05, "1": 1.5027001020554696e-06}, "score": 4.257384430508908}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9351724670177688, "5": 0.035960146335156436, "3": 0.028321863804963394, "2": 0.0005387801258815879, "1": 6.600520819498887e-06}, "score": 4.006540921646061}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7340691096231313, "5": 0.2520558220324437, "3": 0.013834026959777259, "2": 3.9613047961412275e-05, "1": 1.2721654891192075e-06}, "score": 4.238138789670696}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7540446991794248, "4": 0.2449131796540098, "3": 0.0010343831709729548, "2": 7.188881224053917e-06, "1": 5.653380308560138e-07}, "score": 4.752994230015585}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6703541460837085, "4": 0.32877866676717926, "3": 0.000864205128581116, "2": 2.8730438939348446e-06, "1": 1.7136980725575434e-07}, "score": 4.669483638986711}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "human", "scores": {"4": 0.540488585789027, "5": 0.4519053155343418, "3": 0.007590073529047363, "2": 1.56708697341503e-05, "1": 4.044632328022473e-07}, "score": 4.444282664579631}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9426804095589558, "4": 0.05721919843124355, "3": 0.00010013713113649135, "2": 1.7996976003055565e-07, "1": 1.642646636750868e-08}, "score": 4.942579918333271}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9333198854847033, "4": 0.0660810870097034, "3": 0.0005986125483113632, "2": 2.7363465396221396e-07, "1": 3.4339758984768734e-08}, "score": 4.932720722432946}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9556165965562493, "4": 0.044327177608733476, "3": 5.60514802129492e-05, "2": 1.262273740875519e-07, "1": 1.2985012878941018e-08}, "score": 4.955560287246947}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9508713140967887, "5": 0.04354998152102579, "3": 0.0055547842251627896, "2": 2.298628096000212e-05, "1": 6.737147737156748e-07}, "score": 4.037947213462018}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8163025015754491, "4": 0.18216532957437098, "3": 0.0015243415997762823, "2": 6.863637561393632e-06, "1": 9.033859194697165e-07}, "score": 4.814761771613386}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9503770484723547, "4": 0.04956333164526149, "3": 5.939396120376568e-05, "2": 1.7684574173227383e-07, "1": 2.2819988419137794e-08}, "score": 4.950317257310709}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8026483911352087, "4": 0.19618487981179147, "3": 0.0011653590989714779, "2": 1.2821310264104517e-06, "1": 6.133623863981481e-08}, "score": 4.8014803049940875}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.965399874262204, "4": 0.03446494356858964, "3": 0.00013480220527676043, "2": 2.838607601994722e-07, "1": 6.144766500178096e-08}, "score": 4.965264353444136}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9990505213403873, "4": 0.0009479270596185801, "3": 1.532867336968896e-06, "2": 1.3576845933535049e-08, "1": 6.241926301751685e-09}, "score": 4.999048941508498}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7742076962354894, "5": 0.21188561538296521, "3": 0.01388747394730204, "2": 1.8815190670649725e-05, "1": 3.6521394660628447e-07}, "score": 4.1979594221489664}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8238201726212354, "5": 0.16850312219739372, "3": 0.00764352343136238, "2": 3.255407516710894e-05, "1": 5.602946673001867e-07}, "score": 4.160792820565943}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9261585024789031, "4": 0.07369862033320441, "3": 0.0001425736285665034, "2": 1.7336424385590974e-07, "1": 0}, "score": 4.92601570268454}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9948334761332545, "4": 0.005163722731616227, "3": 2.734363153073721e-06, "2": 9.850634180774398e-09, "1": 0}, "score": 4.9948307786959365}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.521570174914364, "4": 0.46788932316317056, "3": 0.010521859802370812, "2": 1.8031614131353377e-05, "1": 0}, "score": 4.511012563859947}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8851409810851713, "3": 0.10403735100903534, "5": 0.009292162277592381, "2": 0.0015156340692822493, "1": 1.3660637989101623e-05}, "score": 3.9021825405842763}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7057890656482739, "4": 0.29341637607137, "3": 0.0007937341313160405, "2": 7.247819398163576e-07, "1": 5.519574334234861e-08}, "score": 4.704993747506379}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9694761024098334, "4": 0.03046735184503086, "3": 5.6199033428144125e-05, "2": 2.1553080305651033e-07, "1": 5.711151939005007e-08}, "score": 4.969419372784537}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.987787590223683, "4": 0.01220146808068698, "3": 1.0740402423348522e-05, "2": 8.908293920364788e-08, "1": 4.509795207524192e-08}, "score": 4.987776602653499}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8218900105464794, "4": 0.17790764707316173, "3": 0.0002016360940189506, "2": 4.368025825944992e-07, "1": 0}, "score": 4.8216877222787895}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9289401874879092, "3": 0.06259702036575741, "5": 0.00843649787675157, "2": 2.60296964648413e-05, "1": 1.934989017893338e-07}, "score": 3.9457868337682007}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8211370770060434, "4": 0.1787666776896641, "3": 9.609954275613722e-05, "2": 8.698614359495422e-08, "1": 0}, "score": 4.821040851747998}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5396426595745467, "5": 0.45920811136977685, "3": 0.0011488089143438438, "2": 4.492474443510417e-07, "1": 1.2070842537577247e-08}, "score": 4.45805834888657}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.5979030870226362, "4": 0.4018467427470633, "3": 0.00024993316895987515, "2": 2.2253665663241417e-07, "1": 1.318004359782572e-08}, "score": 4.597652670043861}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5230744883057, "4": 0.476579132200577, "3": 0.00034591402376939033, "2": 3.852193209695811e-07, "1": 2.163096465421882e-08}, "score": 4.522727769592523}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6038163400812292, "4": 0.39397189685789097, "3": 0.0022100600320453054, "2": 1.4932494106651066e-06, "1": 7.766368991950496e-08}, "score": 4.601603140040534}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9698508521278829, "4": 0.03012857566322443, "3": 2.0505118911305547e-05, "2": 1.4595304055552779e-08, "1": 0}, "score": 4.969830368729296}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9428281033259766, "4": 0.05699134869201512, "3": 0.00018033884580830934, "2": 1.5535034194240385e-07, "1": 0}, "score": 4.94264750448059}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.941105218524449, "4": 0.058794615582305546, "3": 9.994345319135574e-05, "2": 1.1715218744435574e-07, "1": 0}, "score": 4.941005139843307}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9854946796835776, "4": 0.014495253905464252, "3": 1.0019152968125278e-05, "2": 1.0233880534748252e-08, "1": 0}, "score": 4.98548467654954}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6827228807720973, "5": 0.3147179934591182, "3": 0.0025563188616326456, "2": 2.7348471781867715e-06, "1": 1.3045428213897227e-07}, "score": 4.312155795312161}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6926940386172953, "5": 0.2975588376314413, "3": 0.009735914550393706, "2": 1.0913936581115602e-05, "1": 2.619097128549377e-07}, "score": 4.287800319078205}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5786965454041477, "4": 0.4162180905355573, "3": 0.0050775927388950915, "2": 6.8953864529571765e-06, "1": 2.820506985711431e-07}, "score": 4.5736046563950215}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5714450562008734, "5": 0.42403787496161766, "3": 0.004509612722487525, "2": 7.058394078276748e-06, "1": 2.1363219832473895e-07}, "score": 4.419513581782106}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9467553294603207, "3": 0.029868394433698105, "5": 0.02311266600078594, "2": 0.00026117078917228543, "1": 2.194358081486008e-06}, "score": 3.992715345130064}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7362836061739853, "3": 0.21514423829507365, "5": 0.04713839168012844, "2": 0.001414608308482828, "1": 1.8580191831660327e-05}, "score": 3.829109097870428}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6380923033530282, "4": 0.35994051402675065, "3": 0.001964691585349685, "2": 2.3491429463725948e-06, "1": 8.049618861824267e-08}, "score": 4.636122711048443}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5326227987517415, "4": 0.46610797298995543, "3": 0.0012687082780632503, "2": 5.391915224128564e-07, "1": 3.508711036454291e-08}, "score": 4.531352877977695}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.973324877427639, "4": 0.02666743289037763, "3": 7.5700264232440355e-06, "2": 1.145224564471962e-08, "1": 5.414691118222002e-09}, "score": 4.973317368298603}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9536697170698754, "4": 0.04627238185874943, "3": 5.7712948435437194e-05, "2": 8.622204064698496e-08, "1": 1.2668655057300363e-08}, "score": 4.953611878764321}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "human", "scores": {"3": 0.5450570014344728, "4": 0.2892391570619769, "2": 0.09721061166174412, "5": 0.053570442976943605, "1": 0.014922322989182986}, "score": 3.26932491030903}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9948304070767147, "4": 0.005158241768981548, "3": 1.1272099006557726e-05, "2": 8.071325700558906e-08, "1": 1.3765257385219423e-08}, "score": 4.994818916912114}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9947172794058354, "4": 0.005277219129645365, "3": 5.539751022511071e-06, "2": 1.3943254416526678e-08, "1": 0}, "score": 4.994711659814755}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7978458664501481, "4": 0.20190332202195904, "3": 0.0002500394131319705, "2": 7.754556847989964e-07, "1": 3.0733486848313996e-08}, "score": 4.797594156747635}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9254243073468819, "3": 0.06746851057184904, "5": 0.0067850094019491535, "2": 0.0003209638686154029, "1": 1.034212800356368e-06}, "score": 3.938671457746634}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8527458451421258, "4": 0.14696845603881098, "3": 0.00028531663340205393, "2": 3.0958380686696044e-07, "1": 3.673459069628788e-08}, "score": 4.852459829712741}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6922724409842623, "4": 0.30677773003953995, "3": 0.0009466141427754966, "2": 2.7216424989453965e-06, "1": 2.9461954232575056e-07}, "score": 4.691319636974157}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8178962288690784, "5": 0.17940976489247099, "3": 0.0026935291326325153, "2": 5.020189344189251e-07, "1": 1.5193015823286525e-08}, "score": 4.176715179055561}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7829677042582704, "5": 0.21424179898924728, "3": 0.0027885776946448807, "2": 1.8928157930634338e-06, "1": 6.561011242871174e-08}, "score": 4.211449230508331}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8891710586934463, "4": 0.1107976183429174, "3": 3.125034943263685e-05, "2": 1.9200932334559293e-08, "1": 3.4481706255534333e-09}, "score": 4.889139804023598}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9379532606019282, "4": 0.061578413503231455, "3": 0.00046693803334951, "2": 1.017566057867383e-06, "1": 3.015285898203533e-07}, "score": 4.937483447318471}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8062962404666277, "5": 0.18377154427629924, "3": 0.009921084887558041, "2": 1.0527370269472822e-05, "1": 4.893308457843255e-07}, "score": 4.173827956414409}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7228101700584127, "5": 0.27266280329298825, "3": 0.004519870210687198, "2": 6.699805914312461e-06, "1": 3.356345223812841e-07}, "score": 4.268128559009784}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8900394512421533, "4": 0.10969656772728976, "3": 0.00026180489688087927, "2": 1.4779951749856312e-06, "1": 6.329363327718592e-07}, "score": 4.889772849561044}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9512261713016452, "4": 0.04873178462891343, "3": 4.18944582969218e-05, "2": 7.844751770612308e-08, "1": 4.0965851808546576e-08}, "score": 4.951184025774397}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6497752923102385, "4": 0.3456015351766626, "3": 0.0046173760028160584, "2": 5.589638175467156e-06, "1": 1.6529931105077792e-07}, "score": 4.645146267953673}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9278987247164613, "3": 0.0418613212046747, "5": 0.02999246786530863, "2": 0.00024643482526233456, "1": 1.1348012868772243e-06}, "score": 3.9876348736376603}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9888158459225564, "4": 0.011178100805163436, "3": 6.015518566705977e-06, "2": 1.3155604123755719e-08, "1": 0}, "score": 4.988809828415633}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6354366745333913, "4": 0.36419832894083254, "3": 0.00036406708786085405, "2": 9.020246401657216e-07, "1": 7.114498498476098e-08}, "score": 4.635070562188574}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5146277784123308, "4": 0.48482764128523104, "3": 0.0005441581698326819, "2": 3.86144185370488e-07, "1": 1.2259447165398867e-08}, "score": 4.514082823374443}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8304432538146156, "4": 0.1694112988086454, "3": 0.00014501824440152697, "2": 3.6287914209720215e-07, "1": 7.180541111595301e-08}, "score": 4.830297289785707}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8913097756942724, "4": 0.10816857382472302, "3": 0.0005192801668130462, "2": 1.9517971391298743e-06, "1": 3.4491114631465375e-07}, "score": 4.890785622766826}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9390684741641978, "3": 0.05095010797913231, "5": 0.009913065940815051, "2": 6.774533206416884e-05, "1": 5.418671371319607e-07}, "score": 3.9588258390314883}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8045494561863163, "4": 0.19520780913281505, "3": 0.00024225952235474828, "2": 3.926473327868975e-07, "1": 4.901222892868637e-08}, "score": 4.804306291276027}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9678121446334599, "5": 0.027441000923109766, "3": 0.004744878752185699, "2": 1.7673010599396583e-06, "1": 2.5901343422279982e-08}, "score": 4.0226925140059056}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9067826533981761, "4": 0.0928693232768128, "3": 0.0003474825882396306, "2": 3.978495174571253e-07, "1": 0}, "score": 4.906434504628839}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9999269756164101, "4": 7.269012607856858e-05, "3": 2.15943616081061e-07, "1": 5.439275310141443e-09, "2": 3.2619717275451576e-09}, "score": 4.999926846435654}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.913667051637878, "4": 0.0861996639337917, "3": 0.00013266691095238577, "2": 4.382689823969165e-07, "1": 4.709909738067118e-08}, "score": 4.913533487614476}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9223989263521951, "4": 0.07745213084294851, "3": 0.0001477944649123823, "2": 9.888323839705517e-07, "1": 8.791925504390006e-08}, "score": 4.922248956486988}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7326307175637444, "5": 0.26311170582563226, "3": 0.004252675349899968, "2": 4.815137290676059e-06, "1": 7.275443285764502e-08}, "score": 4.258849185398407}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9011218967627879, "3": 0.06607385813421124, "5": 0.032635768461964317, "2": 0.00016691046951414204, "1": 1.394863495732948e-06}, "score": 3.96622389901212}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6806794898161697, "4": 0.31601812798484563, "3": 0.003299857477759772, "2": 2.415242166267173e-06, "1": 9.71878629544775e-08}, "score": 4.677374518616231}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9045320145723299, "4": 0.09525917920616976, "3": 0.00020790652049080464, "2": 7.20243130995377e-07, "1": 1.1802185709676913e-07}, "score": 4.904322369057974}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.8703874253179856, "5": 0.12179135539421694, "3": 0.007815080612990232, "2": 5.993326246753716e-06, "1": 8.18145284250622e-08}, "score": 4.113964049925745}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5208167638259109, "4": 0.4780140278283783, "3": 0.0011666020341377233, "2": 2.4320841337236265e-06, "1": 8.229652119190303e-08}, "score": 4.519645098505394}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5212033011512844, "5": 0.4748833566741587, "3": 0.003906481039955591, "2": 6.664797415962314e-06, "1": 1.8212656126069553e-07}, "score": 4.470963006352364}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9793882244644038, "4": 0.02060636644921988, "3": 5.357795257810619e-06, "2": 8.172197437831789e-09, "1": 0}, "score": 4.979382892554684}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9964499546642933, "4": 0.0035452719792809302, "3": 4.795694604275813e-06, "2": 9.388577933282588e-09, "1": 3.6345482919363546e-09}, "score": 4.99644509405329}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9720561263794861, "4": 0.027931997039162024, "3": 1.1683289324072912e-05, "2": 3.971896720482974e-08, "1": 8.903547892831494e-09}, "score": 4.972044477566785}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9987189220818085, "4": 0.00128014016901897, "3": 9.316766728439916e-07, "2": 6.450449620265272e-09, "1": 0}, "score": 4.998717977126771}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8128757094717741, "4": 0.18558520059180522, "3": 0.0015303120654948188, "2": 7.88971141358805e-06, "1": 8.24926125062454e-07}, "score": 4.811327194508045}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8788089536745262, "5": 0.10902435296616177, "3": 0.012148677048756207, "2": 1.725958356107708e-05, "1": 5.403028614884573e-07}, "score": 4.0968395568001155}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.71365092268322, "4": 0.2843020356877376, "3": 0.0020419490716024917, "2": 4.488881483724875e-06, "1": 3.294306419505485e-07}, "score": 4.711599202709471}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7750033399695093, "4": 0.2242292977568452, "3": 0.0007646782506462081, "2": 2.42786569832883e-06, "1": 2.1972237924474756e-07}, "score": 4.774233175029454}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9631688616223779, "5": 0.024659797326357716, "3": 0.012108906775709628, "2": 6.120265420644875e-05, "1": 9.453245776611003e-07}, "score": 4.012425652825927}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "human", "scores": {"3": 0.6165472604682605, "4": 0.3603807383053048, "2": 0.018313673726114282, "5": 0.004697494488316816, "1": 6.057089868202566e-05}, "score": 3.3513410038496176}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8011506277239019, "4": 0.1974491294941285, "3": 0.0013892878517491934, "2": 1.0481801447479159e-05, "1": 4.171287123768262e-07}, "score": 4.799739169668563}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7775924774063893, "4": 0.22131857491453522, "3": 0.0010770510303390126, "2": 1.1517366860039827e-05, "1": 3.7773611257629954e-07}, "score": 4.776491259634265}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8762281296278982, "4": 0.12262222393589542, "3": 0.0011419241368884868, "2": 6.766740833695863e-06, "1": 7.995522127904371e-07}, "score": 4.875070409869177}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9485815599062022, "4": 0.05114839834387405, "3": 0.0002669348331375481, "2": 2.6156681144046865e-06, "1": 4.0669797627935075e-07}, "score": 4.94830825382303}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9215958095316612, "5": 0.05804230719193158, "3": 0.02034381590517596, "2": 1.7449021245011144e-05, "1": 3.4692611664559506e-07}, "score": 4.037662562688434}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9323985713969613, "4": 0.06742855406247288, "3": 0.00017220498801238593, "2": 5.425541179051267e-07, "1": 0}, "score": 4.932225399691881}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5579941502939234, "4": 0.4400781078426721, "3": 0.001923851716759519, "2": 3.523978327080206e-06, "1": 1.989554314237564e-07}, "score": 4.556062746735073}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7995774726715112, "4": 0.20020590840980795, "3": 0.0002158108992844964, "2": 5.92968831522717e-07, "1": 5.244861020377364e-08}, "score": 4.799360448466304}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6960382453095657, "4": 0.30351046136475696, "3": 0.0004496775444258426, "2": 1.44366144695475e-06, "1": 0}, "score": 4.695585800166338}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "human", "scores": {"5": 0.936311798425554, "4": 0.0636074231024151, "3": 8.03737843699896e-05, "2": 2.9359458025452013e-07, "1": 4.3413733751994645e-08}, "score": 4.936230770574309}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9034012609319395, "4": 0.0965185945077398, "3": 7.981844020023366e-05, "2": 2.0811458905946007e-07, "1": 1.3414669365492866e-08}, "score": 4.903321080497684}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9973283951052889, "4": 0.0026698916177416627, "3": 1.7225238293307617e-06, "2": 5.285249551035507e-09, "1": 0}, "score": 4.9973266475177}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9951306439404795, "4": 0.004866479006439867, "3": 2.8511731979048527e-06, "2": 1.4571955669130374e-08, "1": 0}, "score": 4.995127774876202}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7469519648499362, "4": 0.2525709701142554, "3": 0.0004756184503788929, "2": 1.3045342205750206e-06, "1": 5.661963521338673e-08}, "score": 4.746473631244627}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "human", "scores": {"5": 0.882166487015388, "4": 0.11736569739678948, "3": 0.000466599765942741, "2": 1.0436796126889895e-06, "1": 8.254064485633673e-08}, "score": 4.881697631269823}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.948769307517298, "5": 0.047388585098017584, "3": 0.003839745080010664, "2": 2.2759591272766337e-06, "1": 4.284246728520291e-08}, "score": 4.043544161466657}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6478391621479594, "4": 0.3509887525664213, "3": 0.0011710353581370434, "2": 9.687018119686769e-07, "1": 7.891930201819098e-08}, "score": 4.646665954119742}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7704468559958709, "4": 0.2294300704120931, "3": 0.0001227756318065596, "2": 2.271300672675316e-07, "1": 3.5517155630464886e-08}, "score": 4.770323546754904}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8859841304441969, "4": 0.11388890765161203, "3": 0.00012659165078430723, "2": 2.7941603526064804e-07, "1": 6.531670591996242e-08}, "score": 4.885856806618879}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9264121564519389, "3": 0.0418093199079186, "5": 0.03173952593121455, "2": 3.842631679119684e-05, "1": 3.572935943533813e-07}, "score": 3.989852279336318}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7374376918237416, "5": 0.25862808875520604, "3": 0.003931460081845979, "2": 2.5850001292600355e-06, "1": 6.547516018822971e-08}, "score": 4.254691289974313}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7184509306138605, "4": 0.28082080996906994, "3": 0.0007277787287446584, "2": 4.886917081363219e-07, "1": 2.1024718920491444e-08}, "score": 4.717722090593433}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9919042465613147, "4": 0.00808220942613091, "3": 1.337595320577677e-05, "2": 9.861820080796755e-08, "1": 3.035899462760716e-08}, "score": 4.991890621059945}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5536247103095799, "4": 0.44468707341058117, "3": 0.0016846209432172235, "2": 3.4924886347784102e-06, "1": 5.722768798477117e-08}, "score": 4.551932957885375}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9400149026131328, "3": 0.056041174471354024, "5": 0.003910988983544975, "2": 3.279659037366402e-05, "1": 1.1618408082237137e-07}, "score": 3.9478038716748602}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9892477679741679, "4": 0.010735717633523491, "3": 1.634348844814342e-05, "2": 9.659614532422854e-08, "1": 4.470734639273136e-08}, "score": 4.989231126452996}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8697286695994026, "4": 0.12990390424286657, "3": 0.0003670042975620234, "2": 4.058370956927205e-07, "1": 2.6285983147698458e-08}, "score": 4.869360765847529}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8419556906968249, "4": 0.1578467584222335, "3": 0.00019717636025196432, "2": 2.794803083398788e-07, "1": 2.4178403973427143e-08}, "score": 4.841757942489377}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9329659163923347, "4": 0.0670200265850279, "3": 1.3912629962314334e-05, "2": 1.8977059158509382e-08, "1": 0}, "score": 4.932952082815015}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9023306200535143, "4": 0.09745261686276906, "3": 0.00021487072279695882, "2": 1.5306072589957582e-06, "1": 2.100210653645538e-07}, "score": 4.902112194932828}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9493766382733883, "4": 0.05055358581639221, "3": 6.91449867966012e-05, "2": 4.532663115424177e-07, "1": 0}, "score": 4.949306755405065}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9992397356475045, "4": 0.000753414814028593, "3": 6.617545679735469e-06, "1": 0, "2": 0}, "score": 4.999233349916755}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7567980938082144, "4": 0.24293584083235353, "3": 0.00026562872363320995, "2": 1.7307358258772437e-07, "1": 0}, "score": 4.756532318330751}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6992141621882798, "5": 0.28224575949441005, "3": 0.018439577006993595, "2": 9.913678448311209e-05, "1": 1.1980078568344407e-06}, "score": 4.263604358789744}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7047106894281351, "4": 0.29495062781149206, "3": 0.0003383329798281325, "2": 2.8463192004722516e-07, "1": 0}, "score": 4.704371833073323}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8909800467340154, "4": 0.10881379068208857, "3": 0.00020592469793645046, "2": 1.6794656056837637e-07, "1": 0}, "score": 4.890773848443145}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7369038917333238, "5": 0.26021558980456166, "3": 0.0028784811569643235, "2": 1.927599715062638e-06, "1": 3.664605698781479e-08}, "score": 4.257333162310597}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9808787102005444, "4": 0.01911358959123872, "3": 7.733438259603408e-06, "2": 2.212848819385251e-08, "1": 0}, "score": 4.980870878205738}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9012834869110148, "5": 0.09825841333407365, "3": 0.0004569420410266528, "2": 9.673001467954365e-07, "1": 0}, "score": 4.097799555315132}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8643648839009387, "3": 0.07189064744327464, "5": 0.06175578646062412, "2": 0.0019300854546978965, "1": 5.8413122092800217e-05}, "score": 3.9858297261397535}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5508961682302855, "4": 0.44403416558260606, "3": 0.0049387234110203244, "2": 0.0001153554877158229, "1": 1.508484440435623e-05}, "score": 4.545681753485125}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8612079519199612, "3": 0.10138217421250167, "5": 0.036570089480347845, "2": 0.0008243280403974671, "1": 1.5256452952270849e-05}, "score": 3.9334934765339504}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5311531665961995, "5": 0.4656329109653236, "3": 0.0032002415104778435, "2": 1.2786047763723197e-05, "1": 7.270082583400771e-07}, "score": 4.462404993959384}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8903500490892827, "5": 0.10267405735947681, "3": 0.006942821714457066, "2": 3.181212663966896e-05, "1": 1.2243015987734511e-06}, "score": 4.095663941874266}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8892444761327211, "5": 0.10724551931451218, "3": 0.003505519333997943, "2": 4.359348231351249e-06, "1": 8.99732889600136e-08}, "score": 4.103731015087843}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9712389504432507, "4": 0.028684252505267908, "3": 7.637317775032738e-05, "2": 2.9458654678479446e-07, "1": 6.8284161043081e-08}, "score": 4.971161842483733}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5818822333044583, "4": 0.41717759523254266, "3": 0.0009397496950699575, "2": 4.870091137369572e-07, "1": 5.367073264116494e-08}, "score": 4.580941279498121}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9715260095061138, "4": 0.02843606059476067, "3": 3.763980213634071e-05, "2": 1.8579832977079502e-07, "1": 3.341509810602855e-08}, "score": 4.971487966724551}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9682898255101472, "4": 0.03168544347291138, "3": 2.4546727794509187e-05, "2": 5.5790401415457925e-08, "1": 1.4659547606533033e-08}, "score": 4.968265233449444}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9223786374885488, "3": 0.04204076652118913, "5": 0.03553623140514664, "2": 4.3853895769601576e-05, "1": 4.1117743511675795e-07}, "score": 3.9934065229039835}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.664140105170927, "5": 0.33100056389375987, "3": 0.004853760566229171, "2": 5.326394514480086e-06, "1": 1.2462906392106113e-07}, "score": 4.326135815574154}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5175923581041364, "5": 0.46231842209187185, "3": 0.020035000699101888, "2": 5.354024199449739e-05, "1": 5.295458947625359e-07}, "score": 4.442174818295315}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9966643618432945, "4": 0.0033294252083291196, "3": 6.116851834008898e-06, "2": 3.182537211608157e-08, "1": 1.3164289688398442e-08}, "score": 4.996658192783938}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8291848742202484, "5": 0.16583064868778774, "3": 0.004970492247577212, "2": 1.3765446259857666e-05, "1": 1.9587032574770347e-07}, "score": 4.160832041720739}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8926838697680525, "4": 0.10682535225089584, "3": 0.000489369074301276, "2": 1.2229910736726256e-06, "1": 1.4526531614385238e-07}, "score": 4.892191655183569}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8735843923943946, "4": 0.12490310528374193, "3": 0.0015104790905009894, "2": 1.9849794430993105e-06, "1": 9.366727140691827e-08}, "score": 4.872069614017147}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9832354535828445, "4": 0.01672506143050002, "3": 3.942864402856291e-05, "2": 5.282242608240432e-08, "1": 1.2597379762145205e-08}, "score": 4.983195872577179}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9907948858671555, "4": 0.009198526231385468, "3": 6.444748144459874e-06, "2": 2.7286766387343743e-08, "1": 0}, "score": 4.990788501344722}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9834576958078591, "4": 0.01651853161715391, "3": 2.3657390432057108e-05, "2": 7.113730174128518e-08, "1": 7.499458642569885e-09}, "score": 4.983433909586789}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7273897775044668, "4": 0.26686795325845936, "3": 0.005723135267880806, "2": 1.834809139582373e-05, "1": 7.282903761053132e-07}, "score": 4.721627802739351}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7937863377345854, "5": 0.19381464786556873, "3": 0.012384155570454082, "2": 1.4709867954084823e-05, "1": 1.817439515574783e-07}, "score": 4.181400521380585}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8776083372581339, "5": 0.107447212341931, "3": 0.014923198955251809, "2": 2.0961586700854316e-05, "1": 2.249560021193166e-07}, "score": 4.0924814213474985}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9867159847869106, "4": 0.013254144274764845, "3": 2.9684723641109375e-05, "2": 9.342778985928614e-08, "1": 3.106400759567839e-08}, "score": 4.98668608091678}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5940530582235133, "5": 0.39961264043013367, "3": 0.006317723129839717, "2": 1.6156598756705738e-05, "1": 4.3953345593472236e-07}, "score": 4.393261278456861}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9717903724351332, "4": 0.028159159371562447, "3": 5.012914412221904e-05, "2": 2.6301033735730653e-07, "1": 3.481909130061108e-08}, "score": 4.971739652867932}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8459493086707662, "4": 0.15383682749832836, "3": 0.00021365841709432984, "2": 1.5438991790971266e-07, "1": 1.2995898880331076e-08}, "score": 4.845735334647758}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5505305276234946, "4": 0.4477028087600674, "3": 0.0017659037146543675, "2": 7.380022231146505e-07, "1": 3.0455263517838375e-08}, "score": 4.548763051843549}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9053034795279089, "4": 0.0945670662906826, "3": 0.00012871962095621848, "2": 6.240620714790677e-07, "1": 4.274164924256777e-08}, "score": 4.905173444889456}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7729990031357575, "4": 0.22676485034079658, "3": 0.00023551357567286492, "2": 5.404109328675323e-07, "1": 5.977053638497627e-08}, "score": 4.772762254747173}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6083942072059921, "4": 0.388518380049037, "3": 0.0030795512212480596, "2": 7.4253072029256185e-06, "1": 4.2600191303271456e-07}, "score": 4.6052985335474865}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5699644434565715, "4": 0.42899114555459544, "3": 0.0010425902888833445, "2": 1.7521096180976473e-06, "1": 4.745447531023716e-08}, "score": 4.568918218609599}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7761729965084663, "5": 0.20927022909418017, "3": 0.014540439214621767, "2": 1.5904650614935684e-05, "1": 3.5743403833139653e-07}, "score": 4.194696922508184}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9952353646594861, "4": 0.004760309461175769, "3": 4.35255294980803e-06, "2": 1.646106403673086e-08, "1": 0}, "score": 4.995230936255444}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9155400950792347, "5": 0.07049392098815885, "3": 0.013650863490154215, "2": 0.0003122891614028628, "1": 2.4904877080009034e-06}, "score": 4.056211026868418}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9168122513001167, "3": 0.0714399244460885, "5": 0.011637495768360822, "2": 0.00010897942009818283, "1": 8.293048642645036e-07}, "score": 3.9399770933699494}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.621375798198519, "4": 0.3781349032979365, "3": 0.0004886959700440221, "2": 6.605929474652565e-07, "1": 0}, "score": 4.620885744994297}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8021168367443922, "4": 0.19718001219267334, "3": 0.0007023062468453299, "2": 7.30138204127703e-07, "1": 6.575007665721603e-08}, "score": 4.801412912182287}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9928347477063446, "4": 0.007148193582505319, "3": 1.6840076607861817e-05, "2": 1.1590626880654932e-07, "1": 9.111567352533407e-08}, "score": 4.992817413999371}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9061885427584623, "5": 0.07609096854007721, "3": 0.0176464790986193, "2": 7.332059646009599e-05, "1": 4.884535289894894e-07}, "score": 4.058296394579459}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6185318579924743, "5": 0.37587046610035046, "3": 0.0055786135567170774, "2": 1.8182772101652334e-05, "1": 6.687710918624337e-07}, "score": 4.370253558738295}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8234476100731759, "4": 0.17541410255923567, "3": 0.001133588516222902, "2": 4.289064131449718e-06, "1": 3.4795279949711096e-07}, "score": 4.822304450417023}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5168234252731924, "4": 0.47904406119899334, "3": 0.004119095411677659, "2": 1.2997961766336757e-05, "1": 4.222708095241579e-07}, "score": 4.512677066040504}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9882080178628824, "4": 0.011754219458534113, "3": 3.700054188080985e-05, "2": 5.554040333703848e-07, "1": 1.595413022447299e-07}, "score": 4.988169474522097}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7450577476369185, "4": 0.2536875721444278, "3": 0.0012503200755572597, "2": 4.1375861323142874e-06, "1": 1.9300688019464647e-07}, "score": 4.743798595347767}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9013941758260618, "4": 0.09855860826347539, "3": 4.708716967980881e-05, "2": 8.881893301907247e-08, "1": 0}, "score": 4.9013469470019535}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.989981400899679, "4": 0.010003728554814231, "3": 1.4550153712057466e-05, "2": 1.0710694667694572e-07, "1": 0}, "score": 4.989966847677002}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8733065581255117, "4": 0.1259531457895988, "3": 0.0007359314368709991, "2": 3.8173465390258025e-06, "1": 4.822906000026207e-07}, "score": 4.8725616018497595}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9838893228837731, "4": 0.01610844999925967, "3": 2.1495909279443134e-06, "1": 0, "2": 0}, "score": 4.983887249569727}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.999988005296937, "5": 1.0773776266270776e-05, "3": 9.828581798450365e-07, "2": 1.2825440583452827e-07, "1": 0}, "score": 4.000009534410322}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9370013274898011, "5": 0.054115685491765146, "3": 0.008845084482274545, "2": 3.6862086545989566e-05, "1": 8.452444174451368e-07}, "score": 4.045194349925319}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8957018303657046, "5": 0.1033667019709213, "3": 0.0009308165930877353, "2": 5.994969200639772e-07, "1": 5.462976768821242e-09}, "score": 4.102434674718365}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8681462827563345, "5": 0.12437180155185953, "3": 0.0074745078599992645, "2": 7.168672979856467e-06, "1": 1.4332472168490056e-07}, "score": 4.116882537573068}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9364467306773424, "4": 0.0635226146667998, "3": 3.0510612013419297e-05, "2": 7.287428526560068e-08, "1": 1.2817787272498797e-08}, "score": 4.936416090504935}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9375519775073057, "4": 0.06241532754723491, "3": 3.253103503905841e-05, "2": 5.3842054121862965e-08, "1": 1.4538144303217306e-08}, "score": 4.93751938473516}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6990221703586644, "5": 0.2977694349990997, "3": 0.0032060167507358102, "2": 2.3876999963384553e-06, "1": 7.033509113570343e-08}, "score": 4.2945584082361306}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9345982697913987, "4": 0.06528826943206643, "3": 0.00011303681453111186, "2": 3.120654173878317e-07, "1": 5.475851254837495e-08}, "score": 4.93448449796514}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.673913813090057, "4": 0.32483341412024813, "3": 0.0012520901551387271, "2": 6.923079263697569e-07, "1": 4.7575305611563256e-08}, "score": 4.672660157084245}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9222669857007275, "5": 0.06802442820553324, "3": 0.00968534171339113, "2": 2.264682256459069e-05, "1": 5.158880770159454e-07}, "score": 4.058292249943492}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.750777472035739, "5": 0.24813135891501312, "3": 0.0010898840113594882, "2": 1.1824245785115775e-06, "1": 4.800416783078452e-08}, "score": 4.247038979532579}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "human", "scores": {"4": 0.952840829251409, "5": 0.03819047652804355, "3": 0.008964669842387559, "2": 3.7489828304084785e-06, "1": 0}, "score": 4.029218316766584}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8580664456587278, "4": 0.14152487249444093, "3": 0.000408000319692651, "2": 4.6271801836700547e-07, "1": 0}, "score": 4.857657707566328}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8426774211704546, "5": 0.14671775086918176, "3": 0.010596012795443964, "2": 8.80470781986968e-06, "1": 4.024198432979862e-08}, "score": 4.136104003878303}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9761907862081797, "4": 0.02379519760423415, "3": 1.3856473968440243e-05, "2": 4.863545720154615e-08, "1": 0}, "score": 4.976176940895235}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5681107482236404, "5": 0.4311436283329386, "3": 0.0007448132813930716, "2": 7.355266968580717e-07, "1": 0}, "score": 4.430397376121003}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5045601294836052, "4": 0.49384311164452893, "3": 0.0015953747777027272, "2": 1.3038384371850666e-06, "1": 5.901784388719846e-08}, "score": 4.502961980657343}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8843460355574512, "5": 0.11220530560269439, "3": 0.003447171290675022, "2": 1.3402217133020106e-06, "1": 0}, "score": 4.1087554698912605}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6783876902074987, "5": 0.32127385137611747, "3": 0.0003382409657720982, "2": 1.5251849035796017e-07, "1": 0}, "score": 4.320935326212376}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.7268859655075918, "5": 0.2716070843160178, "3": 0.0015058865265794672, "2": 9.848061669119182e-07, "1": 4.986806594866258e-08}, "score": 4.270099086399183}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.976179197916139, "5": 0.021867741914280106, "3": 0.0019524837479466092, "2": 5.663531575797808e-07, "1": 1.5663729816473134e-08}, "score": 4.019914078357405}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9276112366441234, "5": 0.057260708843802244, "3": 0.015108443790903108, "2": 1.9334432195555852e-05, "1": 3.2810423152621337e-07}, "score": 4.0421126096937385}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8133348212166003, "4": 0.18565141064071652, "3": 0.0010117079871525612, "2": 1.8599610710522332e-06, "1": 1.6027864582860528e-07}, "score": 4.81231894489574}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5393499019249819, "5": 0.4596528262459453, "3": 0.000996480885630658, "2": 7.275508088469761e-07, "1": 4.6961392921249596e-08}, "score": 4.458654756910787}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6165487216869994, "4": 0.3828603299771554, "3": 0.0005897723163714291, "2": 1.097898126661113e-06, "1": 8.108263638846187e-08}, "score": 4.615956508502441}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7097810264263568, "5": 0.2857542509364063, "3": 0.004454987606471706, "2": 9.52860719982961e-06, "1": 1.7201588667650542e-07}, "score": 4.281279699746056}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "human", "scores": {"5": 0.6054207246463668, "4": 0.3942298910578979, "3": 0.00034881704485264505, "2": 5.18358888315553e-07, "1": 2.000175134452411e-08}, "score": 4.605070828359127}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9294628410250624, "4": 0.07040696401801716, "3": 0.00012946150237219824, "2": 6.223669290834144e-07, "1": 7.558711536242602e-08}, "score": 4.929331941019238}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8069178118102113, "4": 0.19276549127281573, "3": 0.000316451995775103, "2": 1.653069149939755e-07, "1": 2.034578646120061e-08}, "score": 4.806601015969275}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9945261110278977, "4": 0.0054717543053939, "3": 2.124655258591213e-06, "2": 1.157913575665398e-08, "1": 0}, "score": 4.994523961655267}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9515403732355222, "4": 0.0483860611260986, "3": 7.33575960333677e-05, "2": 1.6592482709204054e-07, "1": 3.891959444125839e-08}, "score": 4.9514665700737694}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7131232160243404, "3": 0.27932966491972877, "5": 0.006578733693248145, "2": 0.0009641001294727958, "1": 4.25808512462802e-06}, "score": 3.7253080868018404}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8950300820885544, "4": 0.10442343035773692, "3": 0.0005456880950142898, "2": 7.449177703707001e-07, "1": 5.297816443916827e-08}, "score": 4.894482746621367}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7982536379426586, "4": 0.20088917322044036, "3": 0.000856270694432162, "2": 8.022456333301926e-07, "1": 9.131123509646469e-08}, "score": 4.7973955084277025}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9982208508655525, "4": 0.001776693902238216, "3": 2.4460526401968974e-06, "2": 2.0432317467858413e-08, "1": 7.792017692583433e-09}, "score": 4.9982183215613905}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8228067068374384, "5": 0.17384423184453188, "3": 0.0033160764071876094, "2": 3.178719570658624e-05, "1": 8.651162032671884e-07}, "score": 4.170462042392815}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7591339233879695, "4": 0.23887528101789887, "3": 0.0019837156538951347, "2": 6.625657140448475e-06, "1": 4.5838701442056375e-07}, "score": 4.757135578151527}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7930975984118659, "4": 0.2060660150750532, "3": 0.0008336504234591325, "2": 2.3223789225413116e-06, "1": 1.4826916982621007e-07}, "score": 4.792259068721511}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7009860936631682, "4": 0.29625678021292834, "3": 0.002752201891128347, "2": 4.499717234230426e-06, "1": 2.1238163829941854e-07}, "score": 4.698224403309724}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9265663668832304, "4": 0.07319582464577494, "3": 0.00023640313762382512, "2": 1.062319322520869e-06, "1": 1.9199912926635117e-07}, "score": 4.926327402998831}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9416242917441019, "4": 0.058182520756346084, "3": 0.00019227344623607082, "2": 7.653879557257754e-07, "1": 1.3387932532726793e-07}, "score": 4.941430099803997}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8406797400810573, "4": 0.15906074590616665, "3": 0.0002592494065397438, "2": 2.0219889404182472e-07, "1": 2.6551090942225037e-08}, "score": 4.840420036757767}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5810555010084063, "4": 0.41806222244986585, "3": 0.0008811756290204139, "2": 9.413065311322114e-07, "1": 5.566579344152465e-08}, "score": 4.580172336072278}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9736462717401975, "4": 0.026322441886126757, "3": 3.122292366750772e-05, "2": 1.2438665877007948e-08, "1": 0}, "score": 4.973615073604611}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8745310754929067, "4": 0.12535198736201572, "3": 0.00011685987388919481, "2": 7.492336843176029e-08, "1": 9.924235907367565e-09}, "score": 4.874414029374648}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.906056602250913, "3": 0.08121524525430265, "5": 0.012384383441012982, "2": 0.00034103423153020174, "1": 2.393425391253346e-06}, "score": 3.9304798657135214}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7484521687274989, "3": 0.24193429450523352, "5": 0.005314911065849482, "2": 0.004276830846871759, "1": 2.155540415497725e-05}, "score": 3.7547622299321275}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9593058941091022, "4": 0.04060459668259844, "3": 8.887865904492792e-05, "2": 4.296770315011813e-07, "1": 6.311578122599507e-08}, "score": 4.959216098886847}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7827053600820648, "5": 0.20544582604885084, "3": 0.011821225407505529, "2": 2.6957527124385526e-05, "1": 5.812551615489833e-07}, "score": 4.193568951437982}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9622939920139713, "4": 0.03763740911210689, "3": 6.75710446673164e-05, "2": 8.345443079894833e-07, "1": 1.43767273645168e-07}, "score": 4.962224368225979}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9779328048549625, "4": 0.02204980545567689, "3": 1.7289814276469792e-05, "2": 6.560401097197779e-08, "1": 3.642592829804159e-08}, "score": 4.977915272447613}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8387142370464351, "5": 0.1593974835124524, "3": 0.001885812531055715, "2": 2.358987633066294e-06, "1": 1.0103104410061403e-07}, "score": 4.157506650998437}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6996836322704751, "5": 0.287638556265933, "3": 0.012636868073006728, "2": 3.923010975560411e-05, "1": 1.6924421719187026e-06}, "score": 4.274918156375824}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.851736237910355, "5": 0.1359930768576864, "3": 0.012228267489857654, "2": 4.17218327093918e-05, "1": 6.098218326896275e-07}, "score": 4.1236795468841825}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8699377340084498, "4": 0.12957033731538656, "3": 0.0004890130899665161, "2": 2.617641071874444e-06, "1": 2.3444097183509788e-07}, "score": 4.869442837526655}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5866299070609531, "4": 0.41276931557602314, "3": 0.0005982804105238119, "2": 2.2532442305830513e-06, "1": 2.3657702380182282e-07}, "score": 4.586026414609996}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5967294803659867, "3": 0.39444344801943376, "5": 0.007738521734470302, "2": 0.0010817625255035413, "1": 6.67013472226563e-06}, "score": 3.6111114926743975}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9997426273560229, "4": 0.00025678612961752624, "3": 4.576363334550268e-07, "2": 6.252421551479919e-09, "1": 0}, "score": 4.999742279808847}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9242476627275723, "5": 0.053110799021945654, "3": 0.022634191901787972, "2": 7.265793824110027e-06, "1": 6.920117463310617e-08}, "score": 4.03046186827484}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9757342036344331, "4": 0.024252475120072347, "3": 1.326690459773732e-05, "2": 2.3903618208265474e-08, "1": 0}, "score": 4.975720918620889}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9712837042226836, "4": 0.02866719045149165, "3": 4.885074152300527e-05, "2": 1.3513939982058945e-07, "1": 2.1820978791687663e-08}, "score": 4.971234612555157}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6235522788395849, "5": 0.3589032950145012, "3": 0.017468772860088744, "2": 7.09117082884527e-05, "1": 4.740912169257571e-06}, "score": 4.3412784762284025}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9563207716608418, "5": 0.03441101370506564, "3": 0.00923720064248917, "2": 3.0422776594579284e-05, "1": 5.585498307200282e-07}, "score": 4.02511129268016}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9972774146762169, "4": 0.002689078524505475, "3": 3.332612280146542e-05, "2": 1.804314337072041e-07, "1": 4.500501090189375e-08}, "score": 4.9972435480389255}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9941153712549274, "4": 0.005869757252003755, "3": 1.481890244323173e-05, "2": 7.131386987808312e-08, "1": 2.7558219427995572e-08}, "score": 4.994100281041669}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9088517858220497, "4": 0.09086694366392827, "3": 0.00027998976752958174, "2": 1.113430241687443e-06, "1": 1.5998160453157358e-07}, "score": 4.908569095913256}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7697536118121253, "5": 0.21562174218885896, "3": 0.01458237020665187, "2": 4.05595213413398e-05, "1": 1.5033133287868552e-06}, "score": 4.200953785794192}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.5575889314910327, "5": 0.37485694717182066, "3": 0.06607311811114429, "2": 0.0014393634668947138, "1": 4.143784351905272e-05}, "score": 4.30578085033825}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8834512915337068, "4": 0.11591521039696037, "3": 0.0006298902248696415, "2": 3.332186042947729e-06, "1": 2.1189584079814928e-07}, "score": 4.882814157539737}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.736999658616373, "5": 0.25524005104340847, "3": 0.007743080292055272, "2": 1.6400102059717142e-05, "1": 6.862196986981775e-07}, "score": 4.247462142505738}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.641704443290994, "5": 0.34741380079995876, "3": 0.01061959499457068, "2": 0.00024826148307900274, "1": 1.3495314592282462e-05}, "score": 4.336257332782694}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7328892499385297, "5": 0.25094753138717774, "3": 0.01614645109339967, "2": 1.6360739927011188e-05, "1": 3.8874742393837603e-07}, "score": 4.234767196819422}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7252271955834805, "4": 0.27377504868276087, "3": 0.0009967475795977147, "2": 1.034351394157192e-06, "1": 0}, "score": 4.724228360328315}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6199819464475124, "5": 0.3772535919404189, "3": 0.002762860839596463, "2": 1.5571147008046983e-06, "1": 3.612668673418844e-08}, "score": 4.374487511311658}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9705525999759439, "4": 0.02937340517225555, "3": 7.353971187754744e-05, "2": 3.3890025699928847e-07, "1": 2.991660977258424e-08}, "score": 4.970478376488383}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8010589573025946, "4": 0.19859468302706845, "3": 0.0003457062956127101, "2": 6.398225273905361e-07, "1": 2.095354484248315e-08}, "score": 4.800711902574945}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8458285241925942, "5": 0.09367001983566413, "3": 0.05937573130425142, "2": 0.001103255416766274, "1": 2.2218817344261452e-05}, "score": 4.032021129265007}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9365084258201751, "4": 0.06313084510187883, "3": 0.0003591174730576339, "2": 1.558220644805931e-06, "1": 4.811634041298268e-08}, "score": 4.936146052488332}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5472421976820685, "5": 0.44626456846544754, "3": 0.006475344941480241, "2": 1.7008063548209227e-05, "1": 6.543411404521116e-07}, "score": 4.439753343980359}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.68685732956033, "4": 0.3123637515247465, "3": 0.0007762406266178428, "2": 2.4600755428890877e-06, "1": 1.5905051194321138e-07}, "score": 4.686075732220874}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7260570398188428, "4": 0.2734579819003212, "3": 0.0004831458417965777, "2": 1.5064495005199453e-06, "1": 1.2766872676801262e-07}, "score": 4.725570641967624}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8306073905335025, "4": 0.16926067445846615, "3": 0.00013185048061587832, "2": 1.466425271297455e-07, "1": 1.4347300943391538e-08}, "score": 4.830475140225797}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9512361925221465, "3": 0.03251414674154393, "5": 0.015233113514112365, "2": 0.000991197252049836, "1": 2.506264668867252e-05}, "score": 3.9806613787719627}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8487880588959861, "5": 0.1123781225165221, "3": 0.038801894741554856, "2": 3.138937807955689e-05, "1": 3.641656465079015e-07}, "score": 4.073512369041188}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7044349689464079, "4": 0.29532152527006783, "3": 0.0002429621228058925, "2": 4.3083786539292953e-07, "1": 0}, "score": 4.704191224596734}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8283486486289166, "4": 0.1704117178884947, "3": 0.0012339819263500512, "2": 5.5250735413359675e-06, "1": 1.1563235873794238e-07}, "score": 4.827103278632758}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8920889157820269, "3": 0.06731205062766096, "5": 0.04044487270005712, "2": 0.0001516708265887322, "1": 2.3030643400992806e-06}, "score": 3.972822566144037}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.94035841202699, "4": 0.0595129704161242, "3": 0.0001283962978587331, "2": 1.6182651024126059e-07, "1": 1.5438568660229715e-08}, "score": 4.9402296871248215}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8310213437833754, "5": 0.15880842141414586, "3": 0.01014866610862382, "2": 2.1059937899594394e-05, "1": 2.920642571951604e-07}, "score": 4.1486167914409755}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9604376202146904, "4": 0.039502212341417715, "3": 5.9924327504079734e-05, "2": 1.5976529578650647e-07, "1": 2.977186550376786e-08}, "score": 4.960377338497273}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.5653573895125018, "5": 0.43318527745229934, "3": 0.0014552861951551551, "2": 1.8749041872141683e-06, "1": 7.764769284713667e-08}, "score": 4.431726049212347}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7622073251905994, "5": 0.2352653153950561, "3": 0.002522264171744812, "2": 4.813408966641434e-06, "1": 2.02129955973565e-07}, "score": 4.232732836565173}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8802730196720667, "4": 0.11913313854154796, "3": 0.000590105631882944, "2": 3.2769252467400025e-06, "1": 3.670910232092117e-07}, "score": 4.879675339968351}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.6718189999845657, "4": 0.3271911900143682, "3": 0.0009881671444305045, "2": 1.4391915869076698e-06, "1": 1.2974524019563618e-07}, "score": 4.67082761480869}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9108256437460523, "4": 0.08912171137024939, "3": 5.2435956983028705e-05, "2": 9.06916994999938e-08, "1": 2.008639734468525e-08}, "score": 4.910773055537596}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9989287046470288, "4": 0.0010701215915520288, "3": 1.1032513115407983e-06, "1": 9.43672353682207e-09, "2": 0}, "score": 4.998927634093438}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9015469985284577, "5": 0.06574063838754583, "3": 0.03256042777113427, "2": 0.00015107275741653805, "1": 8.474101678050999e-07}, "score": 4.0328755233689835}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9864557323182063, "4": 0.013510238143004366, "3": 3.3723926073830314e-05, "2": 1.8976696833090859e-07, "1": 3.257560961215305e-08}, "score": 4.9864216132708306}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.929556048514068, "4": 0.07037684332289619, "3": 6.650635838907282e-05, "2": 1.0729229477500673e-07, "1": 0}, "score": 4.92948978721527}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997543063676252, "4": 0.0002455889142815773, "3": 4.136573317234335e-08, "1": 0, "2": 0}, "score": 4.999754328338688}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7380848559717064, "5": 0.25922955424421557, "3": 0.0026707677529035573, "2": 1.4204056004826697e-05, "1": 0}, "score": 4.256530536908804}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5117915324702972, "4": 0.4870971934205172, "3": 0.0011101279500341154, "2": 1.0846729987907625e-06, "1": 8.67275709218631e-08}, "score": 4.510678962101292}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9934280572992619, "4": 0.006568857224808272, "3": 3.084780666169699e-06, "2": 4.090371662472703e-09, "1": 0}, "score": 4.993424960965068}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5856475973560398, "4": 0.4140098554522294, "3": 0.0003424324999920685, "2": 1.0753107084756576e-07, "1": 0}, "score": 4.58530495398508}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997292837502586, "4": 0.0002705304220534233, "3": 8.868678004011655e-08, "1": 0, "2": 0}, "score": 4.99972929217809}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9765765104689739, "4": 0.02341646433434297, "3": 6.9662395371368975e-06, "2": 1.3308099528111878e-08, "1": 0}, "score": 4.976569562192707}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8939634037939687, "4": 0.10575895328563747, "3": 0.00027627660557390715, "2": 1.1490466033482956e-06, "1": 1.5030654423264603e-07}, "score": 4.89368443801816}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9569497976032351, "4": 0.042819541649491234, "3": 0.0002293532881964238, "2": 9.01361895643647e-07, "1": 3.290332590345482e-07}, "score": 4.956717728219892}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8510458960154416, "4": 0.1484214228262669, "3": 0.0005314822801822666, "2": 1.01751925090529e-06, "1": 2.0152104889459203e-07}, "score": 4.85051175698543}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9928139524046389, "4": 0.007182333131711959, "3": 3.655396460207647e-06, "2": 1.3200052897179914e-08, "1": 8.429469474076725e-09}, "score": 4.992810282488165}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9968307649613026, "4": 0.0031674877917467724, "3": 1.7848824486486675e-06, "2": 1.1099408703521892e-08, "1": 1.0595197548012711e-08}, "score": 4.996828866952483}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9673824530644514, "5": 0.026892702814805602, "3": 0.005717494465847683, "2": 7.134987920708333e-06, "1": 0}, "score": 4.021160942915671}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9938376403053483, "4": 0.006151565356737796, "3": 1.0520940010882228e-05, "2": 1.3057814201493767e-07, "1": 8.467859353444111e-08}, "score": 4.993826661955516}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.7725662603289483, "4": 0.22625219382161155, "3": 0.001177010299623669, "2": 4.1357122302672065e-06, "1": 4.16016464226819e-07}, "score": 4.771379718075413}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9749968214898637, "4": 0.024984208842162823, "3": 1.8711635656252143e-05, "2": 1.6177166035187057e-07, "1": 2.6110899615583265e-08}, "score": 4.974977776372642}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9836776048129023, "4": 0.016303096824205894, "3": 1.9204037779981473e-05, "2": 5.601529827706872e-08, "1": 1.7617079135766564e-08}, "score": 4.9836582562478675}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5746668887332005, "5": 0.42349685124263253, "3": 0.0018321709568978278, "2": 3.776748891609306e-06, "1": 1.0234002390350205e-07}, "score": 4.421656908306704}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.7238277711843928, "5": 0.2743821325127274, "3": 0.0017887672205465922, "2": 1.217692358266589e-06, "1": 1.219630142574707e-07}, "score": 4.27259056113631}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.572555502874797, "4": 0.4268950416784534, "3": 0.0005489237582281403, "2": 4.374882450354968e-07, "1": 2.5808421075499356e-08}, "score": 4.572005665835344}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9122945450377039, "5": 0.08646822271473247, "3": 0.0012360168343686863, "2": 1.1913243148492215e-06, "1": 2.0191502285199193e-08}, "score": 4.0852297629894005}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.5658651387101964, "4": 0.43381255894745924, "3": 0.0003220409005965837, "2": 2.4687702470202456e-07, "1": 1.5906722791606627e-08}, "score": 4.565542555576425}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8774967038021478, "4": 0.12196338527388169, "3": 0.0005379574984966175, "2": 1.806847398705967e-06, "1": 1.3196778462734028e-07}, "score": 4.876954749518064}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8275539148136382, "4": 0.1716152373713598, "3": 0.0008303684832250253, "2": 4.997741702765355e-07, "1": 3.150274979013131e-08}, "score": 4.8267224093296095}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8701843702132401, "4": 0.12964687119397506, "3": 0.00016862824495567726, "2": 8.73437809334006e-08, "1": 2.2632611138951e-08}, "score": 4.8700155171063555}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9514614728760258, "4": 0.0484660948870029, "3": 7.207422984236403e-05, "2": 2.516061170037819e-07, "1": 7.118476614916695e-08}, "score": 4.951388715383988}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8511597991093608, "4": 0.14875419994955577, "3": 8.592824246067538e-05, "2": 1.1369845780525308e-07, "1": 0}, "score": 4.851073608576107}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "human", "scores": {"5": 0.7843050813106861, "4": 0.21534252048214444, "3": 0.00035209564518486096, "2": 2.935464346914025e-07, "1": 1.4391789019117848e-08}, "score": 4.783952351182549}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9444146475411136, "4": 0.055538100403613504, "3": 4.712999137656037e-05, "2": 5.61463029677494e-08, "1": 7.44897051507103e-09}, "score": 4.944367438126084}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8961941761798133, "4": 0.10349969636008523, "3": 0.0003056029034191277, "2": 4.219242674645193e-07, "1": 6.210564191750783e-08}, "score": 4.895887579418365}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.786748476096324, "4": 0.2128815225897733, "3": 0.00036865942780187413, "2": 1.2215060418576275e-06, "1": 8.744428405969527e-08}, "score": 4.786377137223527}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8236199756953974, "5": 0.1752625225974521, "3": 0.0011167412868512531, "2": 6.598330423919871e-07, "1": 1.3425526224016691e-08}, "score": 4.174144436546667}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9153786446651826, "4": 0.08437282566650091, "3": 0.0002476614166631674, "2": 8.062249815125489e-07, "1": 5.484065711065276e-08}, "score": 4.915129212852715}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9607527713230962, "4": 0.038869099552596736, "3": 0.0003762636362624228, "2": 1.4297527939501008e-06, "1": 3.5163328794688155e-07}, "score": 4.960372674050609}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9932357338415677, "4": 0.006763796054580112, "3": 4.3641116455855366e-07, "2": 1.86562074516268e-09, "1": 0}, "score": 4.993235325310929}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9997627567966206, "4": 0.00023680725920447213, "3": 3.2368921320553123e-07, "2": 9.314486132571406e-09, "1": 0}, "score": 4.999762517394464}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9976498359699892, "4": 0.0023479882060638614, "3": 2.1010465084638213e-06, "2": 1.992598854900425e-08, "1": 0}, "score": 4.997647749793931}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7245391655154843, "5": 0.2697415771456433, "3": 0.005707571227534987, "2": 1.1307684716242554e-05, "1": 3.8543009357920515e-07}, "score": 4.264010232409407}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9368563002789896, "4": 0.06305439578304237, "3": 8.917846243991243e-05, "2": 9.989711805563149e-08, "1": 0}, "score": 4.936766945983323}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9510349636220512, "4": 0.0489300378562311, "3": 3.490595894224758e-05, "2": 4.789795627176577e-08, "1": 0}, "score": 4.95100000434344}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9822574263719932, "4": 0.017717667028618288, "3": 2.4850715825037423e-05, "2": 8.643544519080814e-08, "1": 1.924416382697084e-08}, "score": 4.982232296141502}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.815886946151037, "5": 0.1813150233618459, "3": 0.002791176744074463, "2": 6.531466898571158e-06, "1": 1.218423306216124e-07}, "score": 4.1785104539365125}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7162087530329189, "3": 0.2677445833797234, "5": 0.01344650577993232, "2": 0.0025925534523546195, "1": 7.454341079789647e-06}, "score": 3.7404944135427916}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8288095042993651, "5": 0.14978768812924909, "3": 0.021324954910561376, "2": 7.687737023405399e-05, "1": 1.0226666289582624e-06}, "score": 4.128305904399706}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5723887703661849, "4": 0.40289252095002803, "3": 0.024407959276940068, "2": 0.00029963245033109065, "1": 1.0925424083765907e-05}, "score": 4.547348874751393}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8419696335985096, "4": 0.1576185981428806, "3": 0.0004103763058738134, "2": 1.2518426150715393e-06, "1": 1.0760916675038363e-07}, "score": 4.8415564581312935}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8880044186900844, "4": 0.11178076291681807, "3": 0.0002141264135123086, "2": 5.536395465235779e-07, "1": 4.817209140877749e-08}, "score": 4.887789120531328}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5695755754402176, "4": 0.42750628027990567, "3": 0.002911274561637822, "2": 6.576065104105831e-06, "1": 3.19410412981997e-07}, "score": 4.566650175921766}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9604830442256339, "4": 0.039191793640783956, "3": 0.0003216286303184091, "2": 2.813855362068902e-06, "1": 6.029569715874605e-07}, "score": 4.96015409105495}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7094533323149186, "5": 0.26246598140399985, "3": 0.028052492269440468, "2": 2.749085923501589e-05, "1": 7.176097064680752e-07}, "score": 4.234356351198809}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9580275754796674, "4": 0.04176069052433683, "3": 0.0002104875608367576, "2": 1.035557115727831e-06, "1": 1.6824980961203756e-07}, "score": 4.957814552885113}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9062386563705054, "4": 0.09322967562295796, "3": 0.0005284694285618759, "2": 2.7525687262401973e-06, "1": 3.454430641285394e-07}, "score": 4.905703736558468}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5182366747543454, "5": 0.4786519804614429, "3": 0.003103555156235264, "2": 7.0981171445129574e-06, "1": 2.9112998082509524e-07}, "score": 4.475533546075503}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8524056674198828, "5": 0.11503448799153639, "3": 0.03249279846150669, "2": 6.495356032193425e-05, "1": 1.944505217782259e-06}, "score": 4.082405961094886}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6332035592115504, "5": 0.3650260712019326, "3": 0.0017695611517539501, "2": 7.537832327447486e-07, "1": 3.019670573916528e-08}, "score": 4.3632549207769316}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9662027042640853, "4": 0.03373572210212245, "3": 6.125377976466121e-05, "2": 1.985823423326227e-07, "1": 0}, "score": 4.966141170485204}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9752427808316053, "4": 0.02473892165682182, "3": 1.8121454321531078e-05, "2": 3.963972757442657e-08, "1": 0}, "score": 4.975224713135568}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8228379494012333, "5": 0.17401240312160435, "3": 0.0031423605310883576, "2": 6.840860706244551e-06, "1": 1.823242758204158e-07}, "score": 4.170855858961404}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.8611599323033615, "4": 0.1386334887277152, "3": 0.00020525201343678937, "2": 1.1118830928408938e-06, "1": 1.2107689467598508e-07}, "score": 4.860952174218685}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9028907125192396, "4": 0.09672419509615963, "3": 0.0003842790794286719, "2": 6.479832433216598e-07, "1": 0}, "score": 4.90250528667724}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8281880142692187, "4": 0.17148978102697363, "3": 0.0003198235885390074, "2": 1.8806144488998263e-06, "1": 0}, "score": 4.827864843798815}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9697225920153556, "4": 0.030234706276170937, "3": 4.240323082188357e-05, "2": 1.9741395863704517e-07, "1": 0}, "score": 4.969679891956047}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "human", "scores": {"5": 0.5143328268629073, "4": 0.48477718789799, "3": 0.0008893168271013306, "2": 6.536550964887464e-07, "1": 6.537473291499205e-08}, "score": 4.513441980612096}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9311355091883001, "4": 0.0687776459744927, "3": 8.672156273214961e-05, "2": 3.452041323211379e-08, "1": 4.145530794431648e-09}, "score": 4.93104878492282}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9878406289266557, "4": 0.012144890896222647, "3": 1.4346034434171737e-05, "2": 7.790708743565857e-09, "1": 0}, "score": 4.987826392124624}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9739663053836025, "4": 0.02601534299026126, "3": 1.8235505731098554e-05, "1": 0, "2": 0}, "score": 4.973948182973129}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8812975225603613, "5": 0.11737675376623112, "3": 0.0013252882447440319, "2": 2.704947898576734e-07, "1": 0}, "score": 4.116050943672639}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7653355300044768, "5": 0.22917384842929595, "3": 0.005484863892812104, "2": 5.670620560030056e-06, "1": 7.651898170726155e-08}, "score": 4.223677416094608}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9363936356529712, "4": 0.06354639563179956, "3": 5.9692211900711554e-05, "2": 1.9771939665985352e-07, "1": 2.3284591596605173e-08}, "score": 4.936333530114395}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.5077388694913633, "4": 0.4897688910784617, "3": 0.0024906812787627033, "2": 1.4876646746603921e-06, "1": 4.158621894182173e-08}, "score": 4.505245102726439}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9046695536936877, "4": 0.09521117115537776, "3": 0.0001189531309497659, "2": 2.15730261284546e-07, "1": 2.2723322886052074e-08}, "score": 4.904550176522249}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9395665914222122, "4": 0.06035064764579438, "3": 8.246422459054144e-05, "2": 1.8864347103761635e-07, "1": 1.9582294907425173e-08}, "score": 4.939483774290858}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "human", "scores": {"4": 0.9717563817459528, "3": 0.01804764632883813, "5": 0.010190378379531963, "2": 5.3869726032199474e-06, "1": 3.561749098297378e-08}, "score": 3.99213184990791}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8279593168857132, "5": 0.14490584388492214, "3": 0.027005225355971607, "2": 0.0001276520952996276, "1": 1.802143082278392e-06}, "score": 4.117639926688556}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7878290139834989, "5": 0.20856605027923006, "3": 0.0036044020098262275, "2": 5.479312577110711e-07, "1": 2.6000085772189634e-08}, "score": 4.20496046616642}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.5286931881360083, "5": 0.4690488444546169, "3": 0.0022561442653138072, "2": 1.755670013200745e-06, "1": 5.968381254289129e-08}, "score": 4.466789013434235}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.6472772629710136, "4": 0.35057865138715055, "3": 0.0021380779665404787, "2": 5.522057674588943e-06, "1": 3.095271582138137e-07}, "score": 4.645127325908417}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7200390372780979, "5": 0.2743358207175847, "3": 0.005613420670945885, "2": 1.1187091376902072e-05, "1": 3.880032969753851e-07}, "score": 4.268698901148172}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7515548688594721, "4": 0.2479982225450241, "3": 0.0004456767698352497, "2": 1.1409275340645125e-06, "1": 1.0077152613834989e-07}, "score": 4.75110660050402}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6248813732878469, "5": 0.3723573379087716, "3": 0.0027597325668959403, "2": 1.4543543522245035e-06, "1": 6.90432304689988e-08}, "score": 4.369594501640558}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9936109157524642, "4": 0.0063789523727924725, "3": 1.0027943619415477e-05, "2": 6.115923280677218e-08, "1": 1.822240419859565e-08}, "score": 4.993600735215555}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8030145063544349, "4": 0.19661008018990922, "3": 0.00037402971942634907, "2": 1.2013483583666904e-06, "1": 8.715418896371078e-08}, "score": 4.802637888913887}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7191953941318917, "5": 0.2776094802988946, "3": 0.003190505853474931, "2": 4.268239973017826e-06, "1": 1.609635331164155e-07}, "score": 4.274410007353337}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.6818384336571969, "4": 0.3173178582712254, "3": 0.0008428114419593256, "2": 8.520965456894631e-07, "1": 4.0534271937409246e-08}, "score": 4.680993799142488}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5687395969279236, "5": 0.4238283672174393, "3": 0.007422455103855681, "2": 9.041856858061647e-06, "1": 4.48365539877806e-07}, "score": 4.416386520998047}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9314533227176038, "4": 0.06847971561333009, "3": 6.664603519871292e-05, "2": 2.3125172525951959e-07, "1": 3.2023206303198416e-08}, "score": 4.931386166875725}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9777678679055652, "4": 0.02220713600696624, "3": 2.491630872541394e-05, "2": 6.409881243156931e-08, "1": 1.4945747884603443e-08}, "score": 4.977742779279812}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "human", "scores": {"4": 0.585954228979027, "5": 0.4001092476657618, "3": 0.01388774197813571, "2": 4.691538021112805e-05, "1": 1.6649907335213455e-06}, "score": 4.386122757568045}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "claude", "scores": {"3": 0.7757277639520095, "4": 0.11137094526547625, "2": 0.11029639906409232, "5": 0.0023033193518445403, "1": 0.0003013762722460786}, "score": 3.0050784333564327}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.6463675720729551, "5": 0.3499564012902591, "3": 0.0036724987143176234, "2": 3.3557978720570697e-06, "1": 9.202164645672981e-08}, "score": 4.346276942653063}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9578464295930276, "4": 0.04209470576508203, "3": 5.8690481459170474e-05, "2": 1.2232835172293308e-07, "1": 0}, "score": 4.957787544098986}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7574433120321941, "5": 0.22261127278074336, "3": 0.019906077338110666, "2": 3.8642842023187293e-05, "1": 6.039653549566507e-07}, "score": 4.202626116309922}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "human", "scores": {"3": 0.7145141626822907, "4": 0.283390237527174, "2": 0.0016404258602016606, "5": 0.00045419542545363365, "1": 9.8345692277528e-07}, "score": 3.282656234204308}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9830264487915878, "3": 0.012321154695310413, "5": 0.004640278003459926, "2": 1.1966427947667634e-05, "1": 4.592951032490833e-08}, "score": 3.9922950518458267}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.9890841173934858, "3": 0.007800464467063686, "5": 0.003103899669977766, "2": 1.1437821711234562e-05, "1": 1.5357482843999925e-08}, "score": 3.995280513178906}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "gpt4", "scores": {"4": 0.9299606123904978, "5": 0.06857357654579108, "3": 0.0014635834977384465, "2": 1.9589381338015678e-06, "1": 0}, "score": 4.06710609319835}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.8597789565836987, "3": 0.13931914088368666, "2": 0.0005067769966254336, "5": 0.0003941351843606195, "1": 1.1189307680837485e-06}, "score": 3.8600581015087276}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "human", "scores": {"5": 0.615453779752135, "4": 0.38210967662516643, "3": 0.0024305031146361323, "2": 5.6870209830191755e-06, "1": 3.608916724360069e-07}, "score": 4.613010815381419}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.9394247651548872, "5": 0.05252753346008436, "3": 0.008037954046524676, "2": 9.460772676112301e-06, "1": 1.583035412200187e-07}, "score": 4.044470188661433}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9605225247320817, "4": 0.03941222230487643, "3": 6.484362213468367e-05, "2": 3.369794121510917e-07, "1": 0}, "score": 4.960457076651232}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9387707427588494, "4": 0.06114091481528305, "3": 8.800349749627483e-05, "2": 2.2865123170482032e-07, "1": 2.5959012113866177e-08}, "score": 4.938682283229785}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6524714340352173, "5": 0.346309567560957, "3": 0.0012165570500062485, "2": 2.1536747258237835e-06, "1": 7.274744876733243e-08}, "score": 4.345088559089605}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "human", "scores": {"5": 0.8046703890574587, "4": 0.19413835577668345, "3": 0.0011877642743432241, "2": 3.2638600454955033e-06, "1": 1.4115574241595804e-07}, "score": 4.803475742594861}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9710423148597638, "4": 0.02844174837563875, "3": 0.0005134183746720903, "2": 2.294861648837132e-06, "1": 1.0866848622349603e-07}, "score": 4.97052409223053}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9994999930451615, "4": 0.0004985827421944585, "3": 1.3608555161451723e-06, "2": 7.934813394545599e-09, "1": 0}, "score": 4.999498671714548}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.9944860197037912, "4": 0.005495702806680817, "3": 1.8247545137448173e-05, "2": 5.884599852672656e-08, "1": 1.1258347313582988e-08}, "score": 4.994467580753841}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.9471948101656072, "4": 0.05250996593847375, "3": 0.0002947346788648781, "2": 3.9536596788804984e-07, "1": 3.296821241053769e-08}, "score": 4.946899243500117}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "human", "scores": {"4": 0.6968929477823803, "5": 0.29866390540912546, "3": 0.004441831889072207, "2": 1.309040672618661e-06, "1": 3.7614282686315565e-08}, "score": 4.294219333258652}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.5136404869407428, "4": 0.48557282621375364, "3": 0.0007863894537635852, "2": 2.366693068351272e-07, "1": 4.5338603180767924e-08}, "score": 4.512853496022207}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.7548176893134256, "5": 0.23988959075767816, "3": 0.005291245587782656, "2": 1.4360317177679955e-06, "1": 2.3459882552990577e-08}, "score": 4.234595406210441}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8798950147916366, "4": 0.1200102407809594, "3": 9.458780513443573e-05, "2": 1.5297413226673558e-07, "1": 2.4756692015855433e-08}, "score": 4.879800028196854}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.579861730240278, "5": 0.4199128454799853, "3": 0.000225073397014746, "2": 2.4384330757746474e-07, "1": 2.7623941350407575e-08}, "score": 4.419687234854191}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "human", "scores": {"5": 0.663248160123366, "4": 0.33588454303167997, "3": 0.0008663534428881678, "2": 8.96718363696941e-07, "1": 5.390729634559764e-08}, "score": 4.662379846737098}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8008686883473772, "5": 0.19527702256850926, "3": 0.003849919653965797, "2": 4.219314010009249e-06, "1": 1.0819431646106002e-07}, "score": 4.19141834772818}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.5307874608070944, "5": 0.46739018791748066, "3": 0.0018215199300797992, "2": 7.722658352626779e-07, "1": 2.782780879126913e-08}, "score": 4.465567054522065}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.6904040106922487, "4": 0.3093383553587108, "3": 0.00025748914347794314, "2": 1.0378503999122523e-07, "1": 1.1998322363181238e-08}, "score": 4.690146298013287}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.9157161886829386, "5": 0.07904932928941755, "3": 0.0052299921597406245, "2": 4.4101229018218815e-06, "1": 5.940377858849981e-08}, "score": 4.073810340173931}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.8207283182056966, "5": 0.1188813787797439, "3": 0.06035265132055705, "2": 3.7371693439995744e-05, "1": 2.2471992228069658e-07}, "score": 4.058453313143877}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8938388082824064, "5": 0.07579153257707513, "3": 0.03019503717677941, "2": 0.00017192056830485212, "1": 2.357063484317172e-06}, "score": 4.0452455986527385}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8615963409131578, "3": 0.1069734078686116, "5": 0.031346790297486014, "2": 8.330495722982798e-05, "1": 2.3350461396763228e-07}, "score": 3.9242060778777166}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8603161336624439, "4": 0.13946628381718043, "3": 0.0002173573031977759, "2": 2.45934400797465e-07, "1": 0}, "score": 4.860098266671597}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8067830677870781, "4": 0.19276161672538047, "3": 0.0004538393396387561, "2": 1.3117689344340807e-06, "1": 0}, "score": 4.8063267374527285}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "human", "scores": {"5": 0.9389919432022324, "4": 0.06082447631801527, "3": 0.0001826998345798981, "2": 7.020866552582068e-07, "1": 1.292747309355849e-07}, "score": 4.938807497638137}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.7185312363621783, "4": 0.2809877513781608, "3": 0.00047918059814210817, "2": 1.629459814856314e-06, "1": 1.125427148285561e-07}, "score": 4.718048523595767}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.9393089487365073, "4": 0.060640990723069, "3": 4.980789760805745e-05, "2": 1.2348378315329412e-07, "1": 0}, "score": 4.939259015185119}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.8718630850136074, "4": 0.12786264208076253, "3": 0.0002731241784724864, "2": 1.0696810906890716e-06, "1": 9.787320720436364e-08}, "score": 4.871587511443832}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.7216489623896907, "4": 0.2774388307010546, "3": 0.0009079362419001803, "2": 3.7592954441336374e-06, "1": 2.876276716433603e-07}, "score": 4.7207328059337}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "human", "scores": {"4": 0.7578572466755201, "5": 0.2396627385452228, "3": 0.002474782909851063, "2": 4.894389543369177e-06, "1": 2.9549468107749636e-07}, "score": 4.237177290330174}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.8886869168661543, "3": 0.06874929479605447, "5": 0.04149488966210866, "2": 0.0010579337136642883, "1": 1.0802229607522432e-05}, "score": 3.9705973159651338}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8814474440194074, "4": 0.11835741403388707, "3": 0.00019459462682030904, "2": 4.3974624161737614e-07, "1": 5.863558922803295e-08}, "score": 4.881251837120086}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.7655262753844412, "4": 0.23374724429386218, "3": 0.0007227910367907293, "2": 3.2739347793458285e-06, "1": 3.09890136707089e-07}, "score": 4.76479608746307}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.6025620930038389, "5": 0.39648655804807487, "3": 0.0009479201397763023, "2": 3.220438588740486e-06, "1": 1.7198974224875715e-07}, "score": 4.3955316954513295}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "human", "scores": {"4": 0.5023376880918068, "5": 0.4930859891333942, "3": 0.004568921945702907, "2": 6.91433337667497e-06, "1": 3.7740120919605157e-07}, "score": 4.488502159610214}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "claude", "scores": {"5": 0.9980957911106003, "4": 0.0018957381333686472, "3": 8.363145045490942e-06, "2": 4.5031886915094e-08, "1": 3.012320596313208e-08}, "score": 4.9980872799259775}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt35", "scores": {"4": 0.8824937256014647, "5": 0.09754216821151866, "3": 0.019932320879140136, "2": 3.09284835784719e-05, "1": 6.851877148142985e-07}, "score": 4.0775459481117995}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.974856317997655, "4": 0.025031018079371813, "3": 0.00011224787078832361, "2": 3.0154999911025144e-07, "1": 6.236360406045951e-08}, "score": 4.974743330757791}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "gpt35", "target_model": "llama", "scores": {"5": 0.8145269448713387, "4": 0.18513934892728112, "3": 0.0003328638534778484, "2": 6.636705302468119e-07, "1": 1.13628327494213e-07}, "score": 4.814192465754261}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "human", "scores": {"4": 0.86515132080776, "5": 0.10109683086349422, "3": 0.033315504158631506, "2": 0.00043309411409998914, "1": 3.1263245768160153e-06}, "score": 4.06690576778128}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "claude", "scores": {"4": 0.6666797855345198, "5": 0.3279171152302921, "3": 0.005202351209048704, "2": 0.00018932375859330282, "1": 1.012747024412774e-05}, "score": 4.322306152059074}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt35", "scores": {"5": 0.8625253924398625, "4": 0.13716495861392802, "3": 0.00030525563038007484, "2": 4.048350677152091e-06, "1": 2.3642613579902824e-07}, "score": 4.862211424413301}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "gpt4", "scores": {"5": 0.961059318606055, "4": 0.03856192840450501, "3": 0.00037125440596447884, "2": 6.503045190006436e-06, "1": 7.956527420455373e-07}, "score": 4.960672863176101}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "gpt35", "target_model": "llama", "scores": {"4": 0.7984071089731795, "5": 0.18098659703291864, "3": 0.020265579970345313, "2": 0.0003359790671804445, "1": 4.660718207132478e-06}, "score": 4.160035088654303}]