,model,Rating,Rating std,Rating alpha
openai/gpt-4-turbo-2024-04-09,openai/gpt-4-turbo-2024-04-09,1594.5007067628276,0.0,"[-1.3845635529976335, -1.3845635529976335]"
openai/gpt-4o-2024-05-13,openai/gpt-4o-2024-05-13,1592.7941301077603,0.0,"[0.04568118777683594, 0.04568118777683594]"
google/gemini-1.5-pro,google/gemini-1.5-pro,1588.0432715988545,0.0,"[-1.3237085941241276, -1.3237085941241276]"
anthropic/claude-3-opus-20240229,anthropic/claude-3-opus-20240229,1579.6324828383101,0.0,"[-1.9022803747425314, -1.9022803747425314]"
openai/gpt-4-0125-preview,openai/gpt-4-0125-preview,1572.2956264910147,0.0,"[-1.2964624257595005, -1.2964624257595005]"
meta-llama/Meta-Llama-3-70B-Instruct,meta-llama/Meta-Llama-3-70B-Instruct,1570.8311328117184,0.0,"[-4.603470192070972, -4.603470192070972]"
reka/reka-core-20240501,reka/reka-core-20240501,1559.094237592447,0.0,"[1.918626058513155, 1.918626058513155]"
google/gemini-1.5-flash,google/gemini-1.5-flash,1554.2642829212282,0.0,"[-7.594886084584232, -7.594886084584232]"
deepseek/deepseekv2-chat,deepseek/deepseekv2-chat,1551.6405999838605,0.0,"[-1.8778815428886446, -1.8778815428886446]"
yi/yi-large,yi/yi-large,1550.722406695293,0.0,"[-3.1317141477040877, -3.1317141477040877]"
anthropic/claude-3-sonnet-20240229,anthropic/claude-3-sonnet-20240229,1547.2587075268611,0.0,"[-1.163721789996771, -1.163721789996771]"
princeton-nlp/Llama-3-Instruct-8B-SimPO,princeton-nlp/Llama-3-Instruct-8B-SimPO,1546.4633825335688,0.0,"[-3.5798719258862093, -3.5798719258862093]"
chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO,chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO,1546.3030727501637,0.0,"[-1.7243867642416717, -1.7243867642416717]"
Qwen/Qwen1.5-72B-Chat,Qwen/Qwen1.5-72B-Chat,1545.2227314347178,0.0,"[-3.606090814316076, -3.606090814316076]"
01-ai/Yi-1.5-34B-Chat,01-ai/Yi-1.5-34B-Chat,1538.2909120226623,0.0,"[-5.655765944019549, -5.655765944019549]"
Qwen/Qwen2-72B-Instruct,Qwen/Qwen2-72B-Instruct,1529.9481592860868,0.0,"[1.2592812728278204, 1.2592812728278204]"
cohere/command-r-plus,cohere/command-r-plus,1515.7016914662058,0.0,"[-1.1038584071143305, -1.1038584071143305]"
anthropic/claude-3-haiku-20240307,anthropic/claude-3-haiku-20240307,1513.7742390561568,0.0,"[-2.776919019064735, -2.776919019064735]"
mistral/mistral-large-2402,mistral/mistral-large-2402,1510.9674429466431,0.0,"[-1.5407743603857398, -1.5407743603857398]"
reka/reka-flash-20240226,reka/reka-flash-20240226,1507.5443838374554,0.0,"[1.1900446473782722, 1.1900446473782722]"
01-ai/Yi-1.5-9B-Chat,01-ai/Yi-1.5-9B-Chat,1497.869370266637,0.0,"[-1.1419711312478285, -1.1419711312478285]"
chujiezheng/Starling-LM-7B-beta-ExPO,chujiezheng/Starling-LM-7B-beta-ExPO,1488.3512979414404,0.0,"[-2.156870691200311, -2.156870691200311]"
ZhangShenao/SELM-Zephyr-7B-iter-3,ZhangShenao/SELM-Zephyr-7B-iter-3,1487.7488091145638,0.0,"[-2.215647489310186, -2.215647489310186]"
mistralai/Mixtral-8x7B-Instruct-v0.1,mistralai/Mixtral-8x7B-Instruct-v0.1,1480.6446240556097,0.0,"[-9.322644117922437, -9.322644117922437]"
Nexusflow/Starling-LM-7B-beta,Nexusflow/Starling-LM-7B-beta,1480.3331784643756,0.0,"[1.082890580325511, 1.082890580325511]"
cohere/command-r,cohere/command-r,1479.90116606336,0.0,"[-4.2391276161595215, -4.2391276161595215]"
meta-llama/Meta-Llama-3-8B-Instruct,meta-llama/Meta-Llama-3-8B-Instruct,1475.4541104097575,0.0,"[-2.1122942160322964, -2.1122942160322964]"
databricks/dbrx-instruct@together,databricks/dbrx-instruct@together,1474.8373688127638,0.0,"[-0.5904986068776452, -0.5904986068776452]"
openai/gpt-3.5-turbo-0125,openai/gpt-3.5-turbo-0125,1466.3598946942855,0.0,"[-0.9651695918776113, -0.9651695918776113]"
NousResearch/Hermes-2-Theta-Llama-3-8B,NousResearch/Hermes-2-Theta-Llama-3-8B,1465.1390897740393,0.0,"[5.178773956404484, 5.178773956404484]"
NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO,1457.9356811952648,0.0,"[-5.996677248702099, -5.996677248702099]"
allenai/tulu-2-dpo-70b,allenai/tulu-2-dpo-70b,1453.5354352455047,0.0,"[-2.3215759589759273, -2.3215759589759273]"
mistralai/Mistral-7B-Instruct-v0.2,mistralai/Mistral-7B-Instruct-v0.2,1453.252221275434,0.0,"[-0.044718028876104654, -0.044718028876104654]"
Qwen/Qwen1.5-7B-Chat@together,Qwen/Qwen1.5-7B-Chat@together,1445.650931555113,0.0,"[-2.957778551226511, -2.957778551226511]"
reka/reka-edge,reka/reka-edge,1444.8144208787187,0.0,"[-4.651739260141312, -4.651739260141312]"
m-a-p/neo_7b_instruct_v0.1,m-a-p/neo_7b_instruct_v0.1,1436.8763375305823,0.0,"[3.4610794842215, 3.4610794842215]"
microsoft/Phi-3-medium-128k-instruct,microsoft/Phi-3-medium-128k-instruct,1436.8287153568438,0.0,"[-4.268850338307175, -4.268850338307175]"
meta-llama/Llama-2-70b-chat-hf,meta-llama/Llama-2-70b-chat-hf,1430.1930597288922,0.0,"[-1.033403387340286, -1.033403387340286]"
microsoft/Phi-3-mini-128k-instruct,microsoft/Phi-3-mini-128k-instruct,1427.1260268027627,0.0,"[3.6685372602403277, 3.6685372602403277]"
01-ai/Yi-1.5-6B-Chat,01-ai/Yi-1.5-6B-Chat,1424.9026022303344,0.0,"[-8.338699461996384, -8.338699461996384]"
Magpie-Align/Llama-3-8B-Magpie-Pro-SFT-v0.1,Magpie-Align/Llama-3-8B-Magpie-Pro-SFT-v0.1,1412.2895799131497,0.0,"[-1.4978958878441517, -1.4978958878441517]"
google/gemma-7b-it,google/gemma-7b-it,1369.6448044017893,0.0,"[-1.91352252807701, -1.91352252807701]"
meta-llama/Llama-2-7b-chat-hf,meta-llama/Llama-2-7b-chat-hf,1367.3790947221175,0.0,"[-3.1918426231707144, -3.1918426231707144]"
google/gemma-2b-it,google/gemma-2b-it,1292.8012449023058,0.0,"[1.4432503878158514, 1.4432503878158514]"
