---
# Generation settings for one benchmark run.
# NOTE(review): the consumer of this file is not visible here; the
# per-key notes below describe the values only — confirm semantics
# against the loader.

# Identifier of the benchmark these settings apply to.
bench_name: arena-hard-v0.1

# Sampling parameters.
temperature: 0.0
max_tokens: 4096
num_choices: 1

# Token ids on which generation should stop.
# Presumably 2 is the end-of-sequence id for the listed model's
# tokenizer — TODO confirm.
stop_token_ids:
  - 2

# Models to run; presumably each entry names a model defined in
# the consumer's own configuration — verify against the loader.
model_list:
  - mistral_instruct