,model,Rating,Rating std,Rating alpha,Role playing Rating,Role playing Rating std,Role playing Rating alpha,llama Rating,llama Rating std,llama Rating alpha,Planning Rating,Planning Rating std,Planning Rating alpha,Information seeking Rating,Information seeking Rating std,Information seeking Rating alpha,Advice seeking Rating,Advice seeking Rating std,Advice seeking Rating alpha,Creative Writing Rating,Creative Writing Rating std,Creative Writing Rating alpha,Data Analysis Rating,Data Analysis Rating std,Data Analysis Rating alpha,Coding & Debugging Rating,Coding & Debugging Rating std,Coding & Debugging Rating alpha,Math Rating,Math Rating std,Math Rating alpha,claude Rating,claude Rating std,claude Rating alpha,Brainstorming Rating,Brainstorming Rating std,Brainstorming Rating alpha,Reasoning Rating,Reasoning Rating std,Reasoning Rating alpha,Editing Rating,Editing Rating std,Editing Rating alpha
openai/gpt-4o-2024-05-13,openai/gpt-4o-2024-05-13,1609.9391772545994,0.0,"[-6.237611459958771, -6.237611459958771]",-5.93686723501439,0.0,"[-2.132611722904875, -2.132611722904875]",2.7428480451556423,0.0,"[-3.831489011240887, -3.831489011240887]",0.06126642653295821,0.0,"[1.9397915756155724, 1.9397915756155724]",-2.293820738518728,0.0,"[-0.6953173385765692, -0.6953173385765692]",-0.8926921638715692,0.0,"[0.728271910358607, 0.728271910358607]",-9.321361408796852,0.0,"[3.533480951296694, 3.533480951296694]",2.3522622191751097,0.0,"[1.2961657322547462, 1.2961657322547462]",17.236067880086523,0.0,"[-2.7746482054264803, -2.7746482054264803]",10.681722593254143,0.0,"[-0.6758603218886812, -0.6758603218886812]",1.5914547125199492,0.0,"[-0.43923628750804933, -0.43923628750804933]",-3.039539976936626,0.0,"[-0.2011950847591839, -0.2011950847591839]",0.1348652787543895,0.0,"[1.076620766750422, 1.076620766750422]",-8.981902874664982,0.0,"[-2.0946982627202857, -2.0946982627202857]"
openai/gpt-4-turbo-2024-04-09,openai/gpt-4-turbo-2024-04-09,1601.6100708345891,0.0,"[-9.173347306699725, -9.173347306699725]",-3.5902532573442216,0.0,"[-3.830307018687984, -3.830307018687984]",0.19124993291482287,0.0,"[1.3935843812773208, 1.3935843812773208]",-18.906336029063553,0.0,"[-0.20499796602809894, -0.20499796602809894]",-25.326719989155702,0.0,"[1.7468081489925922, 1.7468081489925922]",-20.50084342078637,0.0,"[-3.1363869081379256, -3.1363869081379256]",-6.9947359486606615,0.0,"[-1.8464973503695532, -1.8464973503695532]",2.419444328398674,0.0,"[1.4681178616822672, 1.4681178616822672]",49.660330952707895,0.0,"[-1.2872674158678024, -1.2872674158678024]",55.400622212132404,0.0,"[2.6145446003127972, 2.6145446003127972]",1.9186719044495413,0.0,"[5.079371679036813, 5.079371679036813]",-4.057858671983582,0.0,"[3.126719647714765, 3.126719647714765]",-3.8741986829762127,0.0,"[-0.060257990928246574, -0.060257990928246574]",-24.22945149326968,0.0,"[1.4095243913158804, 1.4095243913158804]"
openai/gpt-4-0125-preview,openai/gpt-4-0125-preview,1586.8340586158577,0.0,"[-7.8462765145861795, -7.8462765145861795]",-3.076695830218164,0.0,"[2.167250978668784, 2.167250978668784]",0.6131798323686377,0.0,"[-1.1828056894108128, -1.1828056894108128]",-2.944612391449758,0.0,"[-0.9090160264220808, -0.9090160264220808]",-4.729211233272771,0.0,"[-2.7358044091824127, -2.7358044091824127]",-2.578739528879763,0.0,"[0.11807856169809172, 0.11807856169809172]",0.6808634520838139,0.0,"[-1.3497205058004562, -1.3497205058004562]",0.21355863646354076,0.0,"[2.2085484013777332, 2.2085484013777332]",13.43216263106668,0.0,"[-1.4718092412326804, -1.4718092412326804]",3.693029682019359,0.0,"[1.7757979098894126, 1.7757979098894126]",1.509920380286958,0.0,"[1.2976502229807765, 1.2976502229807765]",0.11623280876368591,0.0,"[-1.7611877070138173, -1.7611877070138173]",-2.728785606957529,0.0,"[0.8810826478965836, 0.8810826478965836]",-2.077802619619105,0.0,"[1.0767793901208553, 1.0767793901208553]"
google/gemini-1.5-pro,google/gemini-1.5-pro,1578.8264751085844,0.0,"[-7.86547695789136, -7.86547695789136]",-5.445658324526016,0.0,"[-2.0752124960862535, -2.0752124960862535]",-1.5644604774442257,0.0,"[-2.7838260347146804, -2.7838260347146804]",-2.1356906796841475,0.0,"[1.719665522951932, 1.719665522951932]",-8.99890964690573,0.0,"[-0.424234247892052, -0.424234247892052]",-3.5338952517953346,0.0,"[-1.513425709631448, -1.513425709631448]",-15.123220190446883,0.0,"[-1.8020468387648272, -1.8020468387648272]",-2.3662005641246857,0.0,"[1.8791875271244765, 1.8791875271244765]",25.54727999240271,0.0,"[-1.1164472074635512, -1.1164472074635512]",12.398451949475755,0.0,"[0.5802843868915861, 0.5802843868915861]",0.15917597072203965,0.0,"[-1.9188754891327469, -1.9188754891327469]",1.9651923550351484,0.0,"[0.3019359812726108, 0.3019359812726108]",0.9662930884104121,0.0,"[2.2308193129390954, 2.2308193129390954]",-3.273642727841397,0.0,"[0.2194737686582302, 0.2194737686582302]"
meta-llama/Meta-Llama-3-70B-Instruct,meta-llama/Meta-Llama-3-70B-Instruct,1576.7197702999727,0.0,"[-11.681444820802199, -11.681444820802199]",1.099877868897648,0.0,"[0.3582848904039454, 0.3582848904039454]",0.4724349082885056,0.0,"[2.7473790809273044, 2.7473790809273044]",-5.020750845189553,0.0,"[-2.5249435410449648, -2.5249435410449648]",-2.378285138944485,0.0,"[0.8329267191476983, 0.8329267191476983]",-3.4717410853122663,0.0,"[-0.8764805250925596, -0.8764805250925596]",-5.6270710686044865,0.0,"[1.8874329819049516, 1.8874329819049516]",0.4068843364277515,0.0,"[-0.5592426218668369, -0.5592426218668369]",9.568938733431937,0.0,"[1.6408780238292602, 1.6408780238292602]",10.442385671775263,0.0,"[-1.4841853027943532, -1.4841853027943532]",0.588781755272635,0.0,"[-2.3497636543421305, -2.3497636543421305]",0.401501132898731,0.0,"[-0.37602629101326224, -0.37602629101326224]",-3.3283356592503166,0.0,"[-1.414888584987033, -1.414888584987033]",-2.093403946130286,0.0,"[2.5162442515131223, 2.5162442515131223]"
anthropic/claude-3-opus-20240229,anthropic/claude-3-opus-20240229,1568.1497024822097,0.0,"[-10.067252849698434, -10.067252849698434]",-2.3121030829009763,0.0,"[-0.966895757382817, -0.966895757382817]",-1.7245173043804771,0.0,"[2.3270914803493676, 2.3270914803493676]",-4.095814095515669,0.0,"[1.0078035338140214, 1.0078035338140214]",-2.685004538225291,0.0,"[-4.499251331255196, -4.499251331255196]",-0.5590404454066705,0.0,"[-0.5080887765732226, -0.5080887765732226]",-14.896617843179191,0.0,"[-2.1130777773237384, -2.1130777773237384]",0.005135084751376831,0.0,"[1.9429090312424906, 1.9429090312424906]",17.60356217534719,0.0,"[-0.21374537269335647, -0.21374537269335647]",11.230806699255446,0.0,"[1.556058669606875, 1.556058669606875]",-0.31904956794736805,0.0,"[-0.8316093355381718, -0.8316093355381718]",-3.985231174785117,0.0,"[1.2979571416404099, 1.2979571416404099]",-1.9277822285147443,0.0,"[1.7446255221929274, 1.7446255221929274]",1.6220894491735887,0.0,"[0.7517051167315114, 0.7517051167315114]"
google/gemini-1.5-flash,google/gemini-1.5-flash,1556.7892808988079,0.0,"[-13.852458715635976, -13.852458715635976]",-4.422627889703555,0.0,"[1.3726721298756788, 1.3726721298756788]",-4.461530510735487,0.0,"[-3.855381274616718, -3.855381274616718]",-2.6748989969660357,0.0,"[1.5345112959362046, 1.5345112959362046]",-9.956822115790231,0.0,"[-0.8129622822626299, -0.8129622822626299]",-2.9769029601444057,0.0,"[-0.7834861457921378, -0.7834861457921378]",-19.288086562635897,0.0,"[-0.4807251586510297, -0.4807251586510297]",3.3174150290166073,0.0,"[0.36662111867635216, 0.36662111867635216]",22.35306404323891,0.0,"[-3.095707046302252, -3.095707046302252]",12.798472866053034,0.0,"[-0.27286505206533107, -0.27286505206533107]",-2.0757151828495024,0.0,"[4.916443969700573, 4.916443969700573]",0.7941235895836919,0.0,"[0.7283766499007958, 0.7283766499007958]",0.9252901912653491,0.0,"[2.528986829093782, 2.528986829093782]",-0.8690271939173141,0.0,"[-1.085422338409269, -1.085422338409269]"
01-ai/Yi-1.5-34B-Chat,01-ai/Yi-1.5-34B-Chat,1555.105353389833,0.0,"[-12.021611486977235, -12.021611486977235]",-2.0370983761824535,0.0,"[3.5492987206965783, 3.5492987206965783]",0.13670791935523127,0.0,"[-5.46937638711105, -5.46937638711105]",-1.8841142531063197,0.0,"[-0.8287866104911277, -0.8287866104911277]",-4.329199345080619,0.0,"[1.294062461575697, 1.294062461575697]",0.8407494876209067,0.0,"[-0.3146474102207404, -0.3146474102207404]",2.819244745759249,0.0,"[-0.43437326102852625, -0.43437326102852625]",-0.45665402039261255,0.0,"[1.5576854000360452, 1.5576854000360452]",-1.9393814622083363,0.0,"[-2.284142454141784, -2.284142454141784]",6.574579895439849,0.0,"[0.9879788914568932, 0.9879788914568932]",0.06744655553622327,0.0,"[3.739335326070586, 3.739335326070586]",-1.411483847218453,0.0,"[-3.3905090110162694, -3.3905090110162694]",2.7742549059656167,0.0,"[-0.3050285898427334, -0.3050285898427334]",-0.9508977305969305,0.0,"[0.1684618629759579, 0.1684618629759579]"
yi/yi-large,yi/yi-large,1553.1349046158202,0.0,"[-9.901607940521444, -9.901607940521444]",-0.2277676593547194,0.0,"[1.6556404491134786, 1.6556404491134786]",-2.8519491188279726,0.0,"[-2.808933595901427, -2.808933595901427]",-2.3630962410809753,0.0,"[-1.3110216827592291, -1.3110216827592291]",-7.605077507095061,0.0,"[0.5205663883812406, 0.5205663883812406]",0.15679434083051755,0.0,"[0.6645785409995172, 0.6645785409995172]",-5.405570725320421,0.0,"[4.548090785938382, 4.548090785938382]",1.889603200653936,0.0,"[0.24961337791864846, 0.24961337791864846]",7.607954695510615,0.0,"[-3.524514437723826, -3.524514437723826]",4.846381563769915,0.0,"[0.8791601565076097, 0.8791601565076097]",-0.0905611039329326,0.0,"[6.6656474604573965, 6.6656474604573965]",0.11193631701688785,0.0,"[-0.9370973200240948, -0.9370973200240948]",4.580384742765151,0.0,"[-1.6394315581482974, -1.6394315581482974]",-3.5915427276959218,0.0,"[-1.1055847002035306, -1.1055847002035306]"
deepseek/deepseekv2-chat,deepseek/deepseekv2-chat,1547.277367613581,0.0,"[-8.977229805590696, -8.977229805590696]",-0.9319466696255766,0.0,"[0.3529226288779165, 0.3529226288779165]",0.5226626876847331,0.0,"[-1.9043836735706354, -1.9043836735706354]",-3.180602599333846,0.0,"[0.6126565009065361, 0.6126565009065361]",-3.5073381480938775,0.0,"[0.32921027785012136, 0.32921027785012136]",0.14709719910036906,0.0,"[0.06196158759932198, 0.06196158759932198]",-2.060337818875614,0.0,"[-0.5095267645505592, -0.5095267645505592]",1.492455842437886,0.0,"[-0.34668385617793285, -0.34668385617793285]",5.862361707064683,0.0,"[-1.1741660826760558, -1.1741660826760558]",9.059656651459683,0.0,"[2.47134486418436, 2.47134486418436]",-2.4471542263926627,0.0,"[0.3529856619042926, 0.3529856619042926]",-2.3058587245448634,0.0,"[0.28787567644029766, 0.28787567644029766]",-2.38024558878041,0.0,"[-2.247861632850677, -2.247861632850677]",-2.1952418508084586,0.0,"[0.16226680039667007, 0.16226680039667007]"
princeton-nlp/Llama-3-Instruct-8B-SimPO,princeton-nlp/Llama-3-Instruct-8B-SimPO,1543.0979344535508,0.0,"[-12.281134387052589, -12.281134387052589]",0.7419383238923344,0.0,"[3.0704717070430525, 3.0704717070430525]",0.5297946065088962,0.0,"[-0.782600186722162, -0.782600186722162]",1.5013695842024293,0.0,"[-1.7875562537701832, -1.7875562537701832]",9.991662819939227,0.0,"[0.5515451681835692, 0.5515451681835692]",0.10821390693527448,0.0,"[-0.4133943065689584, -0.4133943065689584]",4.342329168376972,0.0,"[3.6670936777208154, 3.6670936777208154]",-0.5557743516146043,0.0,"[-0.36409206254611093, -0.36409206254611093]",-3.768967704888358,0.0,"[-0.4946022268043033, -0.4946022268043033]",-10.131111269160918,0.0,"[-1.8253179669783375, -1.8253179669783375]",-4.76819229406099,0.0,"[0.5690655518149459, 0.5690655518149459]",1.2305769217938571,0.0,"[-0.8869679186577921, -0.8869679186577921]",-3.524173015590839,0.0,"[-0.28740782877712734, -0.28740782877712734]",0.063935616114535,0.0,"[-1.2297719888447223, -1.2297719888447223]"
chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO,chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO,1539.572669122658,0.0,"[-9.750183478792223, -9.750183478792223]",1.9689708713704268,0.0,"[-0.5000223586010459, -0.5000223586010459]",0.7757158089060975,0.0,"[1.6809932503221225, 1.6809932503221225]",2.2284058171835803,0.0,"[-0.6852209815515078, -0.6852209815515078]",9.497268679010297,0.0,"[2.0870817853456725, 2.0870817853456725]",0.49104680782090215,0.0,"[-0.2705661876982586, -0.2705661876982586]",3.0156457649742947,0.0,"[-2.0940961555671675, -2.0940961555671675]",-0.3946022310296672,0.0,"[0.5846057168341028, 0.5846057168341028]",-2.9482783789922085,0.0,"[3.2943568259769007, 3.2943568259769007]",-14.591489569283427,0.0,"[0.7480850226943101, 0.7480850226943101]",-1.3703376344687308,0.0,"[-1.5329716997058742, -1.5329716997058742]",1.9000360517335635,0.0,"[-0.03343732561250934, -0.03343732561250934]",-2.8115770841018572,0.0,"[0.028758255412548728, 0.028758255412548728]",1.644573271314083,0.0,"[-3.159544597233109, -3.159544597233109]"
reka/reka-core-20240501,reka/reka-core-20240501,1533.9881284892942,0.0,"[-9.34410209346811, -9.34410209346811]",3.693801116256493,0.0,"[1.0199045864860738, 1.0199045864860738]",-2.347092482738906,0.0,"[-0.1746675485942064, -0.1746675485942064]",-6.185887894806059,0.0,"[-1.8865753023118668, -1.8865753023118668]",-5.490713782072271,0.0,"[1.9406842570208775, 1.9406842570208775]",0.4885863260975176,0.0,"[1.3552305239415023, 1.3552305239415023]",-1.0482220322165985,0.0,"[1.5049984214676202, 1.5049984214676202]",-2.126355070981874,0.0,"[0.7833104291947026, 0.7833104291947026]",10.457695788595945,0.0,"[-0.5840242162267355, -0.5840242162267355]",8.003466662633704,0.0,"[4.566216746044781, 4.566216746044781]",1.1693895259808265,0.0,"[4.359921136923723, 4.359921136923723]",3.030569875080228,0.0,"[-1.8493567647641869, -1.8493567647641869]",-1.6437664303004296,0.0,"[-4.945026806175164, -4.945026806175164]",-9.179174558286821,0.0,"[-1.9053618746777534, -1.9053618746777534]"
anthropic/claude-3-sonnet-20240229,anthropic/claude-3-sonnet-20240229,1533.4207830766247,0.0,"[-6.427777429279558, -6.427777429279558]",-2.175175235467132,0.0,"[-0.011190462866768502, -0.011190462866768502]",-1.4228460122463675,0.0,"[-3.5012236209775196, -3.5012236209775196]",-4.0339532511728615,0.0,"[-2.9093635727240503, -2.9093635727240503]",-1.3244304248273946,0.0,"[0.46873875591454484, 0.46873875591454484]",-2.2236425935732145,0.0,"[0.5803582857997851, 0.5803582857997851]",-15.401292479127923,0.0,"[0.6144572647141171, 0.6144572647141171]",1.658199264740851,0.0,"[-1.0521627845897015, -1.0521627845897015]",19.16356147369882,0.0,"[-0.7783923299793614, -0.7783923299793614]",12.20563843917184,0.0,"[2.8614840489186903, 2.8614840489186903]",0.20526055445184632,0.0,"[-0.18074870924689762, -0.18074870924689762]",-3.46613776498625,0.0,"[0.6844983961312758, 0.6844983961312758]",-3.006863703749976,0.0,"[-0.3874620582099806, -0.3874620582099806]",-1.3959037247066208,0.0,"[-0.07096554310839664, -0.07096554310839664]"
Qwen/Qwen2-72B-Instruct,Qwen/Qwen2-72B-Instruct,1528.1585747545578,0.0,"[-5.473753957182225, -5.473753957182225]",2.2060776669581488,0.0,"[-0.1952110886861802, -0.1952110886861802]",-0.49060584592079637,0.0,"[2.701050124935971, 2.701050124935971]",-3.7792270476639045,0.0,"[0.7966039941240775, 0.7966039941240775]",-0.10325841371236856,0.0,"[-2.004846447176397, -2.004846447176397]",-1.1492836542549683,0.0,"[-1.7374027141937478, -1.7374027141937478]",-10.200621466153814,0.0,"[0.44758102289810786, 0.44758102289810786]",3.107336097475457,0.0,"[1.0826198162253098, 1.0826198162253098]",0.6803965279130681,0.0,"[1.0262223358731797, 1.0262223358731797]",11.86609623993494,0.0,"[0.4064060864194623, 0.4064060864194623]",-0.7107743623538687,0.0,"[-1.2874589718067724, -1.2874589718067724]",-2.9052003420969292,0.0,"[-0.34810144199255477, -0.34810144199255477]",1.5221963880937417,0.0,"[0.6386502083504836, 0.6386502083504836]",-1.244511996493321,0.0,"[-0.11252177184168488, -0.11252177184168488]"
Qwen/Qwen1.5-72B-Chat,Qwen/Qwen1.5-72B-Chat,1527.934109253196,0.0,"[-12.102825135785224, -12.102825135785224]",1.4078229998683751,0.0,"[2.142162699698135, 2.142162699698135]",-0.25934144192234465,0.0,"[2.132708178888007, 2.132708178888007]",-2.764394608726373,0.0,"[-2.3000986400336987, -2.3000986400336987]",-1.6804457786668827,0.0,"[-2.809610050737204, -2.809610050737204]",3.0677826471109433,0.0,"[0.8887325911522828, 0.8887325911522828]",1.0355049375197019,0.0,"[5.3401959261605665, 5.3401959261605665]",-1.6330389305126922,0.0,"[-2.0121424544199815, -2.0121424544199815]",2.8408181107966834,0.0,"[1.247959427811723, 1.247959427811723]",1.9933909049126337,0.0,"[-6.29365898945013, -6.29365898945013]",-1.236522044692868,0.0,"[-1.8310069637310205, -1.8310069637310205]",-0.31650517839688513,0.0,"[1.3278394610033224, 1.3278394610033224]",-0.05459241352961521,0.0,"[1.3407482262705614, 1.3407482262705614]",-3.896342690375831,0.0,"[1.127871802544374, 1.127871802544374]"
01-ai/Yi-1.5-9B-Chat,01-ai/Yi-1.5-9B-Chat,1516.678397999832,0.0,"[-8.450361770257814, -8.450361770257814]",-2.0630707936536767,0.0,"[-1.8186179629839645, -1.8186179629839645]",-0.8560309867767019,0.0,"[0.32754336054628685, 0.32754336054628685]",-3.1629928311879025,0.0,"[-0.3803482951638544, -0.3803482951638544]",-9.344914891384045,0.0,"[2.0743525866096384, 2.0743525866096384]",3.57323952399697,0.0,"[-0.8631958297489892, -0.8631958297489892]",-3.178650744141851,0.0,"[-3.7904607473147705, -3.7904607473147705]",0.5617456447337507,0.0,"[-0.3989781089670079, -0.3989781089670079]",1.4797434382184707,0.0,"[5.251659617119661, 5.251659617119661]",9.027615954496346,0.0,"[0.1987933667635602, 0.1987933667635602]",-3.12011056168071,0.0,"[-2.1352112005504766, -2.1352112005504766]",-0.01788588752016728,0.0,"[-0.9580049163288076, -0.9580049163288076]",6.326093769710665,0.0,"[0.12124449511567104, 0.12124449511567104]",-3.2009231832684413,0.0,"[0.5635557948990213, 0.5635557948990213]"
cohere/command-r-plus,cohere/command-r-plus,1509.6840736557808,0.0,"[-7.4570798131683205, -7.4570798131683205]",1.7859472900779048,0.0,"[-0.0719152839248729, -0.0719152839248729]",-0.020609687378555185,0.0,"[2.458546455045613, 2.458546455045613]",8.432101369296854,0.0,"[3.9289046860419017, 3.9289046860419017]",4.570701501859045,0.0,"[0.8366440244105227, 0.8366440244105227]",1.0727201320077369,0.0,"[1.4820885188641097, 1.4820885188641097]",5.280687873910745,0.0,"[-2.0157139213218302, -2.0157139213218302]",-0.42174940048363163,0.0,"[-0.473536279570597, -0.473536279570597]",-14.345139287698368,0.0,"[-2.7305309613334465, -2.7305309613334465]",-10.052604749981917,0.0,"[-1.8309813687020497, -1.8309813687020497]",0.910673638940266,0.0,"[2.683587452857225, 2.683587452857225]",0.2457659442056525,0.0,"[-1.2591215391493644, -1.2591215391493644]",1.2487455677868404,0.0,"[-0.6114748164927977, -0.6114748164927977]",2.1828237590190316,0.0,"[2.745636941178309, 2.745636941178309]"
chujiezheng/Starling-LM-7B-beta-ExPO,chujiezheng/Starling-LM-7B-beta-ExPO,1496.3199817677744,0.0,"[-10.29984684548117, -10.29984684548117]",3.0661882676673167,0.0,"[-1.645119598134404, -1.645119598134404]",-2.2427839593022503,0.0,"[0.5102515050681697, 0.5102515050681697]",2.75340866999917,0.0,"[-1.0605339636657765, -1.0605339636657765]",4.2234766814821025,0.0,"[-0.9771839484618061, -0.9771839484618061]",1.7967916167601905,0.0,"[-0.7781156115656709, -0.7781156115656709]",3.2259508267145915,0.0,"[-0.5198414292475579, -0.5198414292475579]",0.9315736363460267,0.0,"[0.9144903277875508, 0.9144903277875508]",-5.367724948443187,0.0,"[4.634375810727863, 4.634375810727863]",-12.165676386684737,0.0,"[-4.084381198052068, -4.084381198052068]",-1.8771268674520105,0.0,"[0.6693459403172055, 0.6693459403172055]",2.1598567350470983,0.0,"[-0.13949339601806754, -0.13949339601806754]",-0.9867037446231033,0.0,"[4.738217634607987, 4.738217634607987]",0.3628586457344373,0.0,"[-1.0824146279781477, -1.0824146279781477]"
anthropic/claude-3-haiku-20240307,anthropic/claude-3-haiku-20240307,1492.0842556651041,0.0,"[-9.518511253099177, -9.518511253099177]",-8.449639644894608,0.0,"[-1.5258441189265861, -1.5258441189265861]",-4.521907309575046,0.0,"[-1.8056593324585504, -1.8056593324585504]",-11.49986423548564,0.0,"[1.843762071288504, 1.843762071288504]",8.275470685173442,0.0,"[4.27556710017619, 4.27556710017619]",-11.750725777672194,0.0,"[1.6187920217446337, 1.6187920217446337]",-37.08567739305372,0.0,"[-1.408965307371588, -1.408965307371588]",18.61105168861588,0.0,"[-2.7341931360660183, -2.7341931360660183]",26.788968075393505,0.0,"[2.961909765259101, 2.961909765259101]",14.84553576519813,0.0,"[-7.623327360607748, -7.623327360607748]",4.641860463510275,0.0,"[-1.5333346706094408, -1.5333346706094408]",3.8825740765205268,0.0,"[1.0738327260200071, 1.0738327260200071]",2.812939173868312,0.0,"[1.534209446332494, 1.534209446332494]",-6.430632413664614,0.0,"[-0.015743207849841845, -0.015743207849841845]"
mistral/mistral-large-2402,mistral/mistral-large-2402,1491.3780087557404,0.0,"[-6.896476501989127, -6.896476501989127]",1.3539245810714953,0.0,"[-1.0176126865032515, -1.0176126865032515]",1.8522949610172608,0.0,"[3.1507645170622016, 3.1507645170622016]",-2.763781210550001,0.0,"[0.26108231157429307, 0.26108231157429307]",-4.580415950275838,0.0,"[1.5040677978961048, 1.5040677978961048]",-0.547841758283033,0.0,"[0.5841030254576107, 0.5841030254576107]",4.513723360072714,0.0,"[2.2745176684810287, 2.2745176684810287]",-0.22336818767751226,0.0,"[-1.2018801844052858, -1.2018801844052858]",-3.652908299598718,0.0,"[-1.7860135872971463, -1.7860135872971463]",2.6894997815913824,0.0,"[0.6691140646267759, 0.6691140646267759]",1.211476987922363,0.0,"[-2.8055590347566666, -2.8055590347566666]",-1.513782013920573,0.0,"[-1.2770724958432895, -1.2770724958432895]",2.2646341353069213,0.0,"[2.020874962871321, 2.020874962871321]",2.4603155622631006,0.0,"[-2.031180876858234, -2.031180876858234]"
ZhangShenao/SELM-Zephyr-7B-iter-3,ZhangShenao/SELM-Zephyr-7B-iter-3,1488.1240404169048,0.0,"[-7.709174034659327, -7.709174034659327]",2.813248799233663,0.0,"[-0.7298055299475847, -0.7298055299475847]",-1.652168387188949,0.0,"[0.9281945988301139, 0.9281945988301139]",3.6619337143071693,0.0,"[-0.39709701914218964, -0.39709701914218964]",8.548006082795121,0.0,"[0.11281941189630373, 0.11281941189630373]",2.193273119583538,0.0,"[0.31982702695933574, 0.31982702695933574]",11.32946335039652,0.0,"[-1.8506521674225045, -1.8506521674225045]",-3.0160211927847187,0.0,"[1.6557374386743846, 1.6557374386743846]",-20.18208467817508,0.0,"[2.185440142029954, 2.185440142029954]",-9.620460661543724,0.0,"[0.4764901341050738, 0.4764901341050738]",-2.5670683676586186,0.0,"[-3.3923130088964855, -3.3923130088964855]",-0.9278769503987643,0.0,"[-0.4057452458996236, -0.4057452458996236]",0.3503190252596796,0.0,"[-1.319632787750638, -1.319632787750638]",4.850199391326659,0.0,"[-0.047381403502468444, -0.047381403502468444]"
reka/reka-flash-20240226,reka/reka-flash-20240226,1483.4060948005585,0.0,"[-7.458637737680419, -7.458637737680419]",1.4778284180148966,0.0,"[1.4788546214537128, 1.4788546214537128]",1.6197939712880898,0.0,"[0.407408728639054, 0.407408728639054]",-5.103734372490006,0.0,"[3.2291775004097083, 3.2291775004097083]",4.623984362912805,0.0,"[-1.1572556230928095, -1.1572556230928095]",1.022082684837761,0.0,"[-0.7314356966693056, -0.7314356966693056]",2.80891279369706,0.0,"[-1.7486960242814873, -1.7486960242814873]",-3.253514301004327,0.0,"[-1.9785933048182598, -1.9785933048182598]",0.14253860784253805,0.0,"[-0.5374033646698392, -0.5374033646698392]",0.2160872450751118,0.0,"[-0.3166326676780429, -0.3166326676780429]",-4.05430506861586,0.0,"[0.0930082254994451, 0.0930082254994451]",-2.0654710163943037,0.0,"[2.9882623853614034, 2.9882623853614034]",1.5620100776616155,0.0,"[-0.4872759849700288, -0.4872759849700288]",-1.430724500153081,0.0,"[-0.7390018410449949, -0.7390018410449949]"
Nexusflow/Starling-LM-7B-beta,Nexusflow/Starling-LM-7B-beta,1480.839856324457,0.0,"[-6.184914283391436, -6.184914283391436]",2.4149313517758983,0.0,"[0.24080805509732128, 0.24080805509732128]",0.7210222916533516,0.0,"[-1.045574472076101, -1.045574472076101]",0.5006426500594534,0.0,"[-0.9479252931025837, -0.9479252931025837]",3.4339809800941046,0.0,"[-4.207625270879534, -4.207625270879534]",2.4864620383012115,0.0,"[-0.6523400011140317, -0.6523400011140317]",6.944654905427716,0.0,"[-0.601985328163023, -0.601985328163023]",1.1615053884244935,0.0,"[-1.2486876544889975, -1.2486876544889975]",-5.790504242366498,0.0,"[2.222612097441197, 2.222612097441197]",-12.019142451680501,0.0,"[1.3752061095414057, 1.3752061095414057]",-1.43534064081466,0.0,"[-0.3131947523726737, -0.3131947523726737]",0.21922124097092832,0.0,"[-0.9243300694436057, -0.9243300694436057]",0.07079292106509293,0.0,"[0.3799372356457844, 0.3799372356457844]",0.5774552179280896,0.0,"[4.364330119466061, 4.364330119466061]"
meta-llama/Meta-Llama-3-8B-Instruct,meta-llama/Meta-Llama-3-8B-Instruct,1475.9214336138016,0.0,"[-9.386146182561106, -9.386146182561106]",0.6694978993322355,0.0,"[0.9905457985298104, 0.9905457985298104]",-3.359308194365453,0.0,"[1.8863258730844645, 1.8863258730844645]",4.744062767469828,0.0,"[1.0236728179462484, 1.0236728179462484]",3.4832352965998035,0.0,"[4.6972689984232225, 4.6972689984232225]",-0.23858755943000165,0.0,"[-1.7775687265911118, -1.7775687265911118]",-5.138261847765467,0.0,"[-3.53532758043026, -3.53532758043026]",2.9287744699303664,0.0,"[-0.2255591805106376, -0.2255591805106376]",-5.793770546482129,0.0,"[-0.7836208790191579, -0.7836208790191579]",-6.939638755435341,0.0,"[-0.4656133095430839, -0.4656133095430839]",-0.6292464279846393,0.0,"[-1.7385073490244436, -1.7385073490244436]",2.180806139192501,0.0,"[-0.7838378953353411, -0.7838378953353411]",-1.3145299223555695,0.0,"[-0.2744122007409282, -0.2744122007409282]",5.418412058943709,0.0,"[1.134452157271161, 1.134452157271161]"
m-a-p/neo_7b_instruct_v0.1,m-a-p/neo_7b_instruct_v0.1,1472.771345974127,0.0,"[-2.236114546513136, -2.236114546513136]",2.749823188554435,0.0,"[-0.7000296189539461, -0.7000296189539461]",-2.5200675468043485,0.0,"[-0.5768501004093696, -0.5768501004093696]",4.499987874902765,0.0,"[1.7618956652054285, 1.7618956652054285]",-6.209498655872649,0.0,"[0.33703990870508616, 0.33703990870508616]",3.741582294681564,0.0,"[1.7983759130595416, 1.7983759130595416]",7.796838146943953,0.0,"[-0.010478738460137471, -0.010478738460137471]",1.98015305832607,0.0,"[0.6569154976871907, 0.6569154976871907]",-25.261588653243706,0.0,"[-1.0422479684784243, -1.0422479684784243]",-5.9712770578846985,0.0,"[1.0816605139440485, 1.0816605139440485]",-1.0353591253228043,0.0,"[-0.48208974643829405, -0.48208974643829405]",-0.3794643869654214,0.0,"[-0.9167734388789477, -0.9167734388789477]",7.0555331271926125,0.0,"[-3.143515973671395, -3.143515973671395]",9.99791106336484,0.0,"[0.17715823984137558, 0.17715823984137558]"
cohere/command-r,cohere/command-r,1471.7479428239708,0.0,"[-13.144164956469012, -13.144164956469012]",2.605287896070758,0.0,"[0.5927357938532287, 0.5927357938532287]",-2.1676406887488753,0.0,"[-1.2484058297273664, -1.2484058297273664]",4.9045910769898455,0.0,"[1.0207243480732804, 1.0207243480732804]",5.561538654852597,0.0,"[-1.4031037024098563, -1.4031037024098563]",2.7345736574686117,0.0,"[-0.7342262104457093, -0.7342262104457093]",8.917289094829567,0.0,"[-3.2011337228700274, -3.2011337228700274]",-3.4036729023064796,0.0,"[0.7160518975195744, 0.7160518975195744]",-13.018143020791896,0.0,"[0.1481548020565313, 0.1481548020565313]",-16.28967593445989,0.0,"[-0.046185976343231516, -0.046185976343231516]",-3.7873193027455985,0.0,"[4.3691854720936005, 4.3691854720936005]",1.0821636537614239,0.0,"[2.4878024411721915, 2.4878024411721915]",3.569008547458968,0.0,"[0.679817154948863, 0.679817154948863]",3.337039276126294,0.0,"[-0.26063682555499357, -0.26063682555499357]"
mistralai/Mixtral-8x7B-Instruct-v0.1,mistralai/Mixtral-8x7B-Instruct-v0.1,1462.1902470414184,0.0,"[-15.35649539863175, -15.35649539863175]",-2.3294796201260985,0.0,"[0.8421061802694676, 0.8421061802694676]",-0.842844706895922,0.0,"[-3.0540576201031406, -3.0540576201031406]",-1.9793563204931357,0.0,"[-5.956279606696072, -5.956279606696072]",7.997611885660884,0.0,"[2.8220420933687516, 2.8220420933687516]",1.13418388215779,0.0,"[-0.21563195449650463, -0.21563195449650463]",0.17285684919227792,0.0,"[-2.083225431582626, -2.083225431582626]",-0.5264644944019645,0.0,"[-1.0990431144959096, -1.0990431144959096]",-4.336522910572479,0.0,"[4.6021956521038225, 4.6021956521038225]",2.8646910597111743,0.0,"[2.708431559398488, 2.708431559398488]",3.3136101536618026,0.0,"[-1.62295645210737, -1.62295645210737]",-0.4670355291709901,0.0,"[-0.3312076051270798, -0.3312076051270798]",-3.598671529048604,0.0,"[0.08397217592451822, 0.08397217592451822]",1.0681867270911245,0.0,"[-1.3733599486668746, -1.3733599486668746]"
databricks/dbrx-instruct@together,databricks/dbrx-instruct@together,1458.8124226472885,0.0,"[-7.645928554753482, -7.645928554753482]",-2.142968528763743,0.0,"[-0.3260144984596056, -0.3260144984596056]",3.3200155655157335,0.0,"[-0.4167710006626457, -0.4167710006626457]",-0.6900696948340256,0.0,"[-0.4852936581457097, -0.4852936581457097]",-2.977583616986501,0.0,"[3.587429451916008, 3.587429451916008]",2.3661721586429936,0.0,"[-1.1962723902359236, -1.1962723902359236]",-0.3816003840195751,0.0,"[-3.240583947894813, -3.240583947894813]",-0.3251220514557728,0.0,"[2.4500142588529443, 2.4500142588529443]",3.129246278179064,0.0,"[-0.5474291001685758, -0.5474291001685758]",3.810040538708674,0.0,"[-0.29758139572407494, -0.29758139572407494]",0.7199994901384494,0.0,"[0.18130305296114857, 0.18130305296114857]",-3.5856933939279534,0.0,"[-0.46951121026519305, -0.46951121026519305]",-0.7352535763851531,0.0,"[2.8931549038195064, 2.8931549038195064]",1.5328322708419908,0.0,"[-2.367912413694584, -2.367912413694584]"
NousResearch/Hermes-2-Theta-Llama-3-8B,NousResearch/Hermes-2-Theta-Llama-3-8B,1453.811595097067,0.0,"[-2.347144142936486, -2.347144142936486]",-0.9910029205570774,0.0,"[-2.638713857683094, -2.638713857683094]",3.6112025998621884,0.0,"[-1.4928269940420322, -1.4928269940420322]",3.602115489328895,0.0,"[2.2137556172572133, 2.2137556172572133]",6.638397602940741,0.0,"[0.08264920156955124, 0.08264920156955124]",2.6156363931226747,0.0,"[0.21767774114820426, 0.21767774114820426]",-0.1040791567413744,0.0,"[-0.8197529604895216, -0.8197529604895216]",1.650886653330672,0.0,"[1.6214066781276704, 1.6214066781276704]",-7.379285724465929,0.0,"[3.7404749145085736, 3.7404749145085736]",-1.629101302697076,0.0,"[0.6806161964687363, 0.6806161964687363]",-0.26084796859267756,0.0,"[2.472490612048073, 2.472490612048073]",-1.6715648863077328,0.0,"[-0.9861492717414211, -0.9861492717414211]",-2.233221919181413,0.0,"[-2.621983241077844, -2.621983241077844]",-0.49878022877240247,0.0,"[-1.4899810180881419, -1.4899810180881419]"
mistralai/Mistral-7B-Instruct-v0.2,mistralai/Mistral-7B-Instruct-v0.2,1445.5477398679118,0.0,"[-5.323068873188504, -5.323068873188504]",0.9349269288674645,0.0,"[-1.2949735466071575, -1.2949735466071575]",0.1265580251737351,0.0,"[1.8543414758400734, 1.8543414758400734]",3.4814948289217216,0.0,"[-0.1535316606188717, -0.1535316606188717]",6.701268407924475,0.0,"[-2.0825308570546905, -2.0825308570546905]",2.7607686679555554,0.0,"[0.9275201387026932, 0.9275201387026932]",7.729402806537059,0.0,"[2.1363396044110656, 2.1363396044110656]",1.2057894475819588,0.0,"[0.6765878474295072, 0.6765878474295072]",-7.28388739113278,0.0,"[2.9152562398814768, 2.9152562398814768]",-14.987194764132518,0.0,"[-1.0954063072395943, -1.0954063072395943]",1.5568349852377616,0.0,"[-4.060535430834397, -4.060535430834397]",-3.3830322917416704,0.0,"[-1.1871488170879312, -1.1871488170879312]",-2.4403242142601873,0.0,"[-2.874551780343438, -2.874551780343438]",5.280787573478859,0.0,"[2.0324391385268403, 2.0324391385268403]"
allenai/tulu-2-dpo-70b,allenai/tulu-2-dpo-70b,1444.2942824167803,0.0,"[-8.127422928109581, -8.127422928109581]",1.0021373677430736,0.0,"[2.126749818533902, 2.126749818533902]",0.5306669704980517,0.0,"[1.7268259784516755, 1.7268259784516755]",1.6697611706098285,0.0,"[-0.8127760267431443, -0.8127760267431443]",1.5757007237944582,0.0,"[-0.3480072400175467, -0.3480072400175467]",1.71257728604144,0.0,"[-0.3897290027453788, -0.3897290027453788]",1.3529530308842284,0.0,"[-1.2140856554814645, -1.2140856554814645]",-1.3980882978914975,0.0,"[0.2536340830334469, 0.2536340830334469]",-9.322643421301047,0.0,"[-0.1751980933587287, -0.1751980933587287]",-5.8614935564789015,0.0,"[-0.5416760266954643, -0.5416760266954643]",1.7927324723351343,0.0,"[-1.0822162667192872, -1.0822162667192872]",1.033468620100898,0.0,"[1.105762079608808, 1.105762079608808]",1.1004178895027137,0.0,"[-0.6280451297102274, -0.6280451297102274]",7.135209186994792,0.0,"[0.6233711935758368, 0.6233711935758368]"
NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,1444.2468082728828,0.0,"[-13.969093132177932, -13.969093132177932]",1.7012054526528775,0.0,"[-0.8949122486358945, -0.8949122486358945]",4.2440519433328,0.0,"[3.6916682627248645, 3.6916682627248645]",0.4151059266657682,0.0,"[1.4828859151973164, 1.4828859151973164]",-0.7260951600211434,0.0,"[-2.5674296124489784, -2.5674296124489784]",2.4584043666504334,0.0,"[1.3389472804423705, 1.3389472804423705]",2.7666900604753732,0.0,"[1.2188424797789168, 1.2188424797789168]",-0.7113290745110679,0.0,"[0.2180225306720719, 0.2180225306720719]",-1.1712252435623187,0.0,"[0.7356706274367975, 0.7356706274367975]",1.8538817774192577,0.0,"[3.8263518271934656, 3.8263518271934656]",2.863215552744458,0.0,"[-3.0434992461817854, -3.0434992461817854]",-1.7801193292907482,0.0,"[-1.1895468045633881, -1.1895468045633881]",-0.8290696672967113,0.0,"[-4.247927454027025, -4.247927454027025]",-3.9774491091816992,0.0,"[0.07909545895444392, 0.07909545895444392]"
01-ai/Yi-1.5-6B-Chat,01-ai/Yi-1.5-6B-Chat,1440.5535459315927,0.0,"[-17.671170018053772, -17.671170018053772]",0.006067322166876457,0.0,"[0.5200850648041794, 0.5200850648041794]",-0.3766069035710596,0.0,"[0.5889972320228971, 0.5889972320228971]",-0.3520370707702167,0.0,"[-2.492962200407945, -2.492962200407945]",-1.4748984772011156,0.0,"[0.135896102862344, 0.135896102862344]",3.6097754503190393,0.0,"[-0.38819611487153205, -0.38819611487153205]",-3.28953809275999,0.0,"[-2.4608699786957504, -2.4608699786957504]",0.8499630641625554,0.0,"[-0.03698861667596243, -0.03698861667596243]",-12.928769435447967,0.0,"[1.941167684194454, 1.941167684194454]",5.604940580843509,0.0,"[-1.8979605981957395, -1.8979605981957395]",-1.890748825526078,0.0,"[3.779727296717243, 3.779727296717243]",-0.8665360003802296,0.0,"[0.3888873875790029, 0.3888873875790029]",5.660562998043182,0.0,"[3.6301291396192155, 3.6301291396192155]",3.1804696610245258,0.0,"[0.6608121297879572, 0.6608121297879572]"
Qwen/Qwen1.5-7B-Chat@together,Qwen/Qwen1.5-7B-Chat@together,1437.1590139504763,0.0,"[-11.031503272255804, -11.031503272255804]",2.5474932022794863,0.0,"[-0.3803050616952359, -0.3803050616952359]",-2.818346589934894,0.0,"[8.128122801776243, 8.128122801776243]",8.299981789377972,0.0,"[2.27126178581522, 2.27126178581522]",-5.259524493742109,0.0,"[-0.8838346970112365, -0.8838346970112365]",2.956155594020728,0.0,"[-0.1317702755513097, -0.1317702755513097]",10.923681663451754,0.0,"[2.099154048200358, 2.099154048200358]",1.3704449015055715,0.0,"[-0.4950615192342491, -0.4950615192342491]",-9.423529312917205,0.0,"[-1.593323147098931, -1.593323147098931]",-13.22133602413686,0.0,"[-0.7619647645017089, -0.7619647645017089]",-0.005271397500836229,0.0,"[1.0562414412845336, 1.0562414412845336]",0.14065988207817645,0.0,"[-1.4039606539491383, -1.4039606539491383]",-1.8555582636861203,0.0,"[-0.9589415423128035, -0.9589415423128035]",3.5215310617685773,0.0,"[2.2387458273389935, 2.2387458273389935]"
meta-llama/Llama-2-70b-chat-hf,meta-llama/Llama-2-70b-chat-hf,1433.8164229394188,0.0,"[-6.519307688323579, -6.519307688323579]",6.602613124892984,0.0,"[-2.7016875483129654, -2.7016875483129654]",0.10533709137613047,0.0,"[-0.4129658309309484, -0.4129658309309484]",21.2642003362461,0.0,"[-3.494132100834225, -3.494132100834225]",34.31450860095799,0.0,"[-1.5779917627260502, -1.5779917627260502]",-5.051820693248911,0.0,"[2.6700102485970225, 2.6700102485970225]",23.07415608981642,0.0,"[-0.7662776771444086, -0.7662776771444086]",-30.38395302705943,0.0,"[-0.2509965043670235, -0.2509965043670235]",-47.749840715533196,0.0,"[0.5438080671080598, 0.5438080671080598]",-57.45975264237361,0.0,"[0.8216855577561191, 0.8216855577561191]",-1.3036945502367299,0.0,"[1.5221097654641003, 1.5221097654641003]",26.907166494259094,0.0,"[5.4668047310861, 5.4668047310861]",12.218005185344996,0.0,"[0.3175828381475636, 0.3175828381475636]",16.26471724669778,0.0,"[-1.0288058493090233, -1.0288058493090233]"
reka/reka-edge,reka/reka-edge,1428.4393819550685,0.0,"[-11.78458527950761, -11.78458527950761]",1.6812610558439747,0.0,"[-0.7164602564262494, -0.7164602564262494]",-5.1606887570012105,0.0,"[0.3706477420533174, 0.3706477420533174]",-2.9500026896416,0.0,"[4.845305925699254, 4.845305925699254]",6.550222006184249,0.0,"[0.31092599345953875, 0.31092599345953875]",1.4935081199881677,0.0,"[1.709557836064973, 1.709557836064973]",13.634363197201367,0.0,"[-0.26258980578284863, -0.26258980578284863]",-2.2336456899483466,0.0,"[0.1793897165414955, 0.1793897165414955]",-1.305334868277285,0.0,"[-1.3657337603037483, -1.3657337603037483]",-9.43289044741002,0.0,"[1.7641395610198778, 1.7641395610198778]",-0.6748547842718069,0.0,"[-2.908907650177402, -2.908907650177402]",2.2879680928037462,0.0,"[-2.850553074843381, -2.850553074843381]",-7.085834347870328,0.0,"[-3.4992925383428664, -3.4992925383428664]",-2.639614428873995,0.0,"[-0.11468959708614435, -0.11468959708614435]"
microsoft/Phi-3-medium-128k-instruct,microsoft/Phi-3-medium-128k-instruct,1417.1281767259397,0.0,"[-11.670435366348556, -11.670435366348556]",0.43458927996857827,0.0,"[0.17756771842644903, 0.17756771842644903]",5.244114859803643,0.0,"[-0.96701998703531, -0.96701998703531]",-1.2679427616569918,0.0,"[1.4417055073011844, 1.4417055073011844]",-3.0921399508321015,0.0,"[3.880940785146949, 3.880940785146949]",0.6661264942248074,0.0,"[-1.2480352856878438, -1.2480352856878438]",-0.1735190526032379,0.0,"[2.9194783537278766, 2.9194783537278766]",3.790068748621622,0.0,"[-3.7227402477295777, -3.7227402477295777]",-0.25628523235777284,0.0,"[-2.9953379726216447, -2.9953379726216447]",10.607617956313351,0.0,"[2.3641592168391217, 2.3641592168391217]",4.329880283859068,0.0,"[-1.298696676218773, -1.298696676218773]",-4.787558087859807,0.0,"[0.45387331589240976, 0.45387331589240976]",-4.210584953304409,0.0,"[-2.244391260387704, -2.244391260387704]",-1.7103724405139629,0.0,"[-1.0272201309071143, -1.0272201309071143]"
Magpie-Align/Llama-3-8B-Magpie-Pro-SFT-v0.1,Magpie-Align/Llama-3-8B-Magpie-Pro-SFT-v0.1,1415.5393483148475,0.0,"[-12.92946254527783, -12.92946254527783]",0.3346743266154543,0.0,"[1.249608669944919, 1.249608669944919]",0.0,0.0,"[0.0, 0.0]",2.623977525119525,0.0,"[-1.1208190127605895, -1.1208190127605895]",3.997319147660125,0.0,"[-0.03484410218462752, -0.03484410218462752]",1.172521259269804,0.0,"[-0.9457694605959688, -0.9457694605959688]",2.1689588195003955,0.0,"[0.3592977585087087, 0.3592977585087087]",-1.059399584018276,0.0,"[-0.29460319419588055, -0.29460319419588055]",-3.778952322193844,0.0,"[0.06441128938609086, 0.06441128938609086]",-3.1158018779253696,0.0,"[-1.401254245778299, -1.401254245778299]",0.0,0.0,"[0.0, 0.0]",0.2152020284950792,0.0,"[0.6003220980586541, 0.6003220980586541]",1.1844020319824777,0.0,"[0.9386182342386231, 0.9386182342386231]",-3.7429013545053893,0.0,"[0.5850319653783593, 0.5850319653783593]"
openai/gpt-3.5-turbo-0125,openai/gpt-3.5-turbo-0125,1413.4613944014911,0.0,"[-8.541732008250165, -8.541732008250165]",3.9639339661862563,0.0,"[-0.6800633871150037, -0.6800633871150037]",3.474079706349188,0.0,"[-2.0063019422702726, -2.0063019422702726]",3.1144766091972973,0.0,"[-1.306743471057715, -1.306743471057715]",-7.879320554774459,0.0,"[1.7487420467872177, 1.7487420467872177]",3.3503627749620053,0.0,"[1.6057828918040973, 1.6057828918040973]",-3.3401825778334877,0.0,"[4.567236809084447, 4.567236809084447]",-1.523616666836225,0.0,"[-0.36965305177450114, -0.36965305177450114]",-0.497866519408378,0.0,"[-4.226065146265088, -4.226065146265088]",-0.5607168892629139,0.0,"[-2.798073961781008, -2.798073961781008]",3.4001882301890847,0.0,"[-3.1102034751465837, -3.1102034751465837]",-0.4538110248853955,0.0,"[0.7583916529942683, 0.7583916529942683]",-0.04038242354689614,0.0,"[0.29046593298507967, 0.29046593298507967]",3.867123306202137,0.0,"[0.4099796843381296, 0.4099796843381296]"
microsoft/Phi-3-mini-128k-instruct,microsoft/Phi-3-mini-128k-instruct,1398.8388091535935,0.0,"[-2.740120953754513, -2.740120953754513]",-0.67192770144513,0.0,"[2.909912629162678, 2.909912629162678]",2.2890684585264314,0.0,"[1.4333487205308937, 1.4333487205308937]",-0.5641260950965559,0.0,"[-0.3642164263410401, -0.3642164263410401]",-12.476841573582405,0.0,"[-5.500911639185721, -5.500911639185721]",1.0737764283364284,0.0,"[0.5674864192415983, 0.5674864192415983]",0.9311609914454548,0.0,"[-1.048682093464689, -1.048682093464689]",1.4596705438254043,0.0,"[0.714423161975987, 0.714423161975987]",8.9506816302656,0.0,"[-2.8157253109311107, -2.8157253109311107]",7.337754458572703,0.0,"[2.3759150622939327, 2.3759150622939327]",-0.42857852362953136,0.0,"[-3.551692650313213, -3.551692650313213]",-2.366674927793236,0.0,"[2.104400733553961, 2.104400733553961]",-5.006829949378372,0.0,"[2.069369284311801, 2.069369284311801]",1.333356194850073,0.0,"[-1.01197182061748, -1.01197182061748]"
meta-llama/Llama-2-7b-chat-hf,meta-llama/Llama-2-7b-chat-hf,1364.301635869098,0.0,"[-8.940731946632923, -8.940731946632923]",-0.8315287661175195,0.0,"[0.502361763459992, 0.502361763459992]",3.483442433933177,0.0,"[-0.9001944570340199, -0.9001944570340199]",1.9690860066272498,0.0,"[-3.113909543593497, -3.113909543593497]",16.755904253394096,0.0,"[-4.742476639328242, -4.742476639328242]",3.3634167303629763,0.0,"[0.36381170601145296, 0.36381170601145296]",11.387660398001621,0.0,"[5.448113058026409, 5.448113058026409]",1.2088474900656883,0.0,"[-4.146369747927552, -4.146369747927552]",-24.24283995780179,0.0,"[3.06948297636459, 3.06948297636459]",-18.739003025183987,0.0,"[0.7523385312953224, 0.7523385312953224]",1.7675109704975993,0.0,"[1.198162743440837, 1.198162743440837]",-0.2209660095001118,0.0,"[1.0479127970105668, 1.0479127970105668]",3.2065758382109797,0.0,"[2.616212013203333, 2.616212013203333]",6.142847041940923,0.0,"[-1.7974769145221314, -1.7974769145221314]"
google/gemma-7b-it,google/gemma-7b-it,1320.1410265562106,0.0,"[-8.800615136917486, -8.800615136917486]",-3.2119096693223947,0.0,"[0.6834307907924244, 0.6834307907924244]",2.052232439753733,0.0,"[-1.0671279206030193, -1.0671279206030193]",1.9611822592229342,0.0,"[2.767969170260816, 2.767969170260816]",-3.672972412495006,0.0,"[2.0946608828087685, 2.0946608828087685]",0.24012354209002584,0.0,"[-0.07467747701865624, -0.07467747701865624]",11.834081011258181,0.0,"[-2.887554641410855, -2.887554641410855]",0.43409254584361695,0.0,"[0.0612422829808148, 0.0612422829808148]",-3.2395598130114425,0.0,"[-0.8255871935345644, -0.8255871935345644]",-3.6978991646347006,0.0,"[-1.685618139614458, -1.685618139614458]",0.29180557739531016,0.0,"[-2.3820572385965266, -2.3820572385965266]",-0.4265639548734219,0.0,"[0.13603269987471267, 0.13603269987471267]",1.3515371768971816,0.0,"[0.8142131776497348, 0.8142131776497348]",-1.5721115209752121,0.0,"[-1.084111552788915, -1.084111552788915]"
google/gemma-2b-it,google/gemma-2b-it,1227.9866503731157,0.0,"[-7.712514690974103, -7.712514690974103]",1.5837184237147306,0.0,"[-1.1489453397873466, -1.1489453397873466]",3.3547309853241147,0.0,"[1.0067914586404667, 1.0067914586404667]",8.61525733525353,0.0,"[1.7315730347460327, 1.7315730347460327]",-8.6327574147414,0.0,"[1.1031568153191902, 1.1031568153191902]",0.5812066287769133,0.0,"[0.08023675953966236, 0.08023675953966236]",9.373712063463733,0.0,"[1.5185587883208465, 1.5185587883208465]",1.005331021380423,0.0,"[-0.5260337721895736, -0.5260337721895736]",-7.526119676074006,0.0,"[-1.9168320273011465, -1.9168320273011465]",-3.568822907732783,0.0,"[-3.1387668990026834, -3.1387668990026834]",1.7305016857501043,0.0,"[0.5748234654494724, 0.5748234654494724]",-3.5029860226779053,0.0,"[-1.5002689521937849, -1.5002689521937849]",-5.266773265168983,0.0,"[0.6050806563512348, 0.6050806563512348]",7.338233813805804,0.0,"[3.1922409361975257, 3.1922409361975257]"
