Rank	model_test	Qwen2.5-0.5B-Instruct
1	gpt-4-turbo-2024-04-09	6.363369634073
2	Meta-Llama-3-70B-Instruct	6.355355448397799
3	reka-core-20240501	6.2956099894315
4	dbrx-instruct@together	6.2842513759412
5	mistral-large-2402	6.2615329603382
6	claude-3-opus-20240229	6.2595304289988
7	Meta-Llama-3-8B-Instruct	6.2413178559631
8	Llama-2-70b-chat-hf	6.2211587916021
9	claude-3-sonnet-20240229	6.185299529522
10	Llama-2-7b-chat-hf	6.100248875197599
11	gemma-7b-it	6.0107061179209005
12	gemma-2b-it	5.9265396585502
