[
  {
    "id": "unknown",
    "results": {},
    "scenario": "verifying_fact",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "mixtral-8x7b-instruct-v0.1",
    "model_b": "gpt-3.5-turbo-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "chitchat",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gpt4all-13b-snoozy",
    "model_b": "alpaca-13b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "creative_writing",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "mixtral-8x7b-instruct-v0.1",
    "model_b": "llama-2-70b-chat",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "code_writing",
    "winner": "model_a",
    "metadata": "{'score_A': 3, 'score_B': 2}",
    "model_a": "64928524",
    "model_b": "64906628",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "recommendation",
    "winner": "model_a",
    "metadata": "{'score_A': 4, 'score_B': 3}",
    "model_a": "fafgm0c",
    "model_b": "faea4f3",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "code_writing",
    "winner": "model_a",
    "metadata": "{'score_A': 39, 'score_B': 7}",
    "model_a": "48688988",
    "model_b": "48688887",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "open_question",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "claude-2.1",
    "model_b": "wizardlm-70b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "open_question",
    "winner": "tie",
    "metadata": "{}",
    "model_a": "stablelm-tuned-alpha-7b",
    "model_b": "koala-13b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "explaining_general",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "claude-2.1",
    "model_b": "gpt-3.5-turbo-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "open_question",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "mixtral-8x7b-instruct-v0.1",
    "model_b": "solar-10.7b-instruct-v1.0",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "roleplay",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gpt-3.5-turbo-0314",
    "model_b": "claude-1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_medical_advice",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "vicuna-13b",
    "model_b": "oasst-pythia-12b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "verifying_fact",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "mixtral-8x7b-instruct-v0.1",
    "model_b": "gpt-4-1106-preview",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "writing_legal_document",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "claude-2.0",
    "model_b": "claude-1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_b",
    "metadata": "{'score_A': 23, 'score_B': 41}",
    "model_a": "106841",
    "model_b": "106916",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "value_judgement",
    "winner": "model_a",
    "metadata": "{'score_A': 13, 'score_B': 5}",
    "model_a": "cdbblf6",
    "model_b": "cdb9mqr",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "chitchat",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "claude-2.1",
    "model_b": "gpt-4-0314",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "llama-2-7b-chat",
    "model_b": "claude-2.1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "value_judgement",
    "winner": "model_a",
    "metadata": "{'score_A': 9, 'score_B': 7}",
    "model_a": "gzasq7k",
    "model_b": "gzar809",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "verifying_fact",
    "winner": "model_b",
    "metadata": "{'score_A': 1, 'score_B': 3}",
    "model_a": "c3chhw4",
    "model_b": "c3ciemp",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "ranking",
    "winner": "model_a",
    "metadata": "{'score_A': 330, 'score_B': 136}",
    "model_a": "hdclk46",
    "model_b": "hdchacp",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "question_generation",
    "winner": "tie",
    "metadata": "{}",
    "model_a": "solar-10.7b-instruct-v1.0",
    "model_b": "claude-1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "creative_writing",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gpt-4-1106-preview",
    "model_b": "claude-2.0",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "ranking",
    "winner": "model_b",
    "metadata": "{'score_A': 16, 'score_B': 49}",
    "model_a": "d6pp1ye",
    "model_b": "d6pqgkp",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "planning",
    "winner": "model_b",
    "metadata": "{'score_A': 1, 'score_B': 3}",
    "model_a": "ic3yokf",
    "model_b": "ic3zh4q",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "verifying_fact",
    "winner": "model_a",
    "metadata": "{'score_A': 79, 'score_B': 67}",
    "model_a": "gjj7s04",
    "model_b": "gji2kum",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "creative_writing",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "claude-2.0",
    "model_b": "chatglm-6b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "brainstorming",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "chatglm-6b",
    "model_b": "claude-1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "recommendation",
    "winner": "model_b",
    "metadata": "{'score_A': 1, 'score_B': 44}",
    "model_a": "ixjvb89",
    "model_b": "ixjyx1y",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "chitchat",
    "winner": "tie",
    "metadata": "{}",
    "model_a": "vicuna-13b",
    "model_b": "koala-13b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_a",
    "metadata": "{'score_A': 21, 'score_B': 9}",
    "model_a": "1766639",
    "model_b": "1766634",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "question_generation",
    "winner": "model_a",
    "metadata": "{'score_A': 12, 'score_B': 3}",
    "model_a": "139675",
    "model_b": "139668",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "code_writing",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "gpt-3.5-turbo-0613",
    "model_b": "vicuna-33b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "math_reasoning",
    "winner": "model_a",
    "metadata": "{'score_A': 6, 'score_B': 4}",
    "model_a": "406071",
    "model_b": "406044",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_a",
    "metadata": "{'score_A': 8, 'score_B': 6}",
    "model_a": "2449845",
    "model_b": "2449840",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "roleplay",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gpt-3.5-turbo-1106",
    "model_b": "vicuna-33b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "open_question",
    "winner": "model_a",
    "metadata": "{'score_A': 10, 'score_B': 1}",
    "model_a": "hg5aqxd",
    "model_b": "hg32hyx",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "analyzing_general",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gpt-3.5-turbo-0613",
    "model_b": "gpt-4-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_advice",
    "winner": "model_b",
    "metadata": "{'score_A': 5, 'score_B': 9}",
    "model_a": "ibillek",
    "model_b": "ibines3",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "creative_writing",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "claude-2.0",
    "model_b": "gpt-4-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "math_reasoning",
    "winner": "model_a",
    "metadata": "{'score_A': 8, 'score_B': 5}",
    "model_a": "283204",
    "model_b": "283048",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "roleplay",
    "winner": "model_a",
    "metadata": "{'score_A': 17, 'score_B': 4}",
    "model_a": "gka1em4",
    "model_b": "gk9lnjz",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "functional_writing",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gemini-pro-dev-api",
    "model_b": "gpt-4-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_b",
    "metadata": "{'score_A': 2, 'score_B': 4}",
    "model_a": "92386",
    "model_b": "4170267",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_advice",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "koala-13b",
    "model_b": "claude-1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "classification_identification",
    "winner": "tie",
    "metadata": "{}",
    "model_a": "gpt-3.5-turbo-0613",
    "model_b": "llama-2-70b-chat",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_a",
    "metadata": "{'score_A': 13, 'score_B': 3}",
    "model_a": "1807926",
    "model_b": "1807921",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_advice",
    "winner": "model_a",
    "metadata": "{'score_A': 7, 'score_B': 0}",
    "model_a": "debdjsh",
    "model_b": "deb7sd4",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_advice",
    "winner": "model_a",
    "metadata": "{'score_A': 9, 'score_B': -24}",
    "model_a": "etg78zo",
    "model_b": "etg58m9",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "explaining_general",
    "winner": "model_b",
    "metadata": "{'score_A': 1, 'score_B': 6}",
    "model_a": "j0g7ieg",
    "model_b": "j0gwsd8",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "ranking",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "gpt-4-0314",
    "model_b": "claude-2.1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_without_math",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "mixtral-8x7b-instruct-v0.1",
    "model_b": "gpt-3.5-turbo-1106",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "explaining_general",
    "winner": "model_b",
    "metadata": "{'score_A': 1, 'score_B': 3}",
    "model_a": "hnfye12",
    "model_b": "hngp8hl",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "chitchat",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "vicuna-7b",
    "model_b": "gpt-3.5-turbo-0314",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "math_reasoning",
    "winner": "model_a",
    "metadata": "{'score_A': 5, 'score_B': 4}",
    "model_a": "1137454",
    "model_b": "1137428",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "value_judgement",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "mixtral-8x7b-instruct-v0.1",
    "model_b": "dolphin-2.2.1-mistral-7b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "explaining_general",
    "winner": "model_a",
    "metadata": "{'score_A': 5, 'score_B': 4}",
    "model_a": "62786578",
    "model_b": "59683356",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "recommendation",
    "winner": "model_b",
    "metadata": "{'score_A': 6, 'score_B': 7}",
    "model_a": "gdhf16g",
    "model_b": "gdhqecf",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "code_writing",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "palm-2",
    "model_b": "claude-2.0",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "verifying_fact",
    "winner": "model_b",
    "metadata": "{'score_A': 3, 'score_B': 5}",
    "model_a": "cune7ug",
    "model_b": "cuno9nv",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "chitchat",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "vicuna-33b",
    "model_b": "claude-instant-1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_without_math",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "RWKV-4-Raven-14B",
    "model_b": "vicuna-7b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "data_analysis",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "gpt-4-1106-preview",
    "model_b": "gpt-3.5-turbo-1106",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "chitchat",
    "winner": "model_a",
    "metadata": "{'score_A': 49, 'score_B': 7}",
    "model_a": "e0yiwm8",
    "model_b": "e0ygwd7",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "default",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "wizardlm-70b",
    "model_b": "vicuna-13b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "verifying_fact",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "claude-2.1",
    "model_b": "llama-2-13b-chat",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "default",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "llama-13b",
    "model_b": "chatglm-6b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "math_reasoning",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "mpt-7b-chat",
    "model_b": "gpt-3.5-turbo-0314",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "recommendation",
    "winner": "model_b",
    "metadata": "{'score_A': 39, 'score_B': 86}",
    "model_a": "ikhrwgb",
    "model_b": "ikhsuoe",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "chitchat",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "claude-2.0",
    "model_b": "oasst-pythia-12b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "creative_writing",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "gpt-4-0613",
    "model_b": "chatglm2-6b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_advice",
    "winner": "model_b",
    "metadata": "{'score_A': 21, 'score_B': 67}",
    "model_a": "iie858f",
    "model_b": "iiecp3a",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "explaining_general",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "koala-13b",
    "model_b": "llama-13b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_medical_advice",
    "winner": "model_b",
    "metadata": "{'score_A': 1, 'score_B': 15}",
    "model_a": "fyjzi4q",
    "model_b": "fyk0pj2",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "explaining_general",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "gemini-pro-dev-api",
    "model_b": "gpt-4-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_a",
    "metadata": "{'score_A': 9, 'score_B': 5}",
    "model_a": "2901334",
    "model_b": "2901280",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "functional_writing",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "gpt-3.5-turbo-0613",
    "model_b": "zephyr-7b-alpha",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "value_judgement",
    "winner": "model_b",
    "metadata": "{'score_A': 7, 'score_B': 24}",
    "model_a": "d5dug4u",
    "model_b": "d5dvgj4",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_a",
    "metadata": "{'score_A': 3, 'score_B': 2}",
    "model_a": "evdyecp",
    "model_b": "evdxah0",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "solving_exam_question_with_math",
    "winner": "model_b",
    "metadata": "{'score_A': 5, 'score_B': 8}",
    "model_a": "1254167",
    "model_b": "1254168",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "math_reasoning",
    "winner": "model_a",
    "metadata": "{'score_A': 14, 'score_B': 2}",
    "model_a": "1989407",
    "model_b": "1986476",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "instructional_rewriting",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "mixtral-8x7b-instruct-v0.1",
    "model_b": "deepseek-llm-67b-chat",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "information_extraction",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gpt-4-0613",
    "model_b": "gpt-4-1106-preview",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "functional_writing",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "wizardlm-70b",
    "model_b": "mistral-medium",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "recommendation",
    "winner": "model_a",
    "metadata": "{'score_A': 6, 'score_B': 4}",
    "model_a": "gj0kdgw",
    "model_b": "gj0fxmz",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "ranking",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "stablelm-tuned-alpha-7b",
    "model_b": "fastchat-t5-3b",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "functional_writing",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "gpt-4-0125-preview",
    "model_b": "gpt-4-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "math_reasoning",
    "winner": "model_b",
    "metadata": "{'score_A': 4, 'score_B': 41}",
    "model_a": "3030565",
    "model_b": "3030580",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "recommendation",
    "winner": "model_a",
    "metadata": "{'score_A': 14, 'score_B': 13}",
    "model_a": "33534",
    "model_b": "19664",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "open_question",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "palm-2",
    "model_b": "gpt-3.5-turbo-1106",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "verifying_fact",
    "winner": "model_b",
    "metadata": "{'score_A': 3, 'score_B': 14}",
    "model_a": "fwpjc6w",
    "model_b": "fwpmf0n",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "open_question",
    "winner": "model_a",
    "metadata": "{}",
    "model_a": "claude-1",
    "model_b": "gpt-4-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "default",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "gpt-3.5-turbo-0613",
    "model_b": "mistral-medium",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_advice",
    "winner": "model_a",
    "metadata": "{'score_A': 6, 'score_B': 1}",
    "model_a": "dv508s5",
    "model_b": "dv4zwpr",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "text_to_text_translation",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "pplx-7b-online",
    "model_b": "llama-2-70b-chat",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "recommendation",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "wizardlm-13b",
    "model_b": "llama-2-13b-chat",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "writing_legal_document",
    "winner": "model_a",
    "metadata": "{'score_A': 4, 'score_B': 3}",
    "model_a": "fuog16u",
    "model_b": "funef0s",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "math_reasoning",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "openchat-3.5",
    "model_b": "claude-instant-1",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "seeking_advice",
    "winner": "model_b",
    "metadata": "{}",
    "model_a": "claude-1",
    "model_b": "gpt-4-0613",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  },
  {
    "id": "unknown",
    "results": {},
    "scenario": "default",
    "winner": "model_b",
    "metadata": "{'score_A': 24, 'score_B': 35}",
    "model_a": "dzkpw6x",
    "model_b": "dzkwgcw",
    "api_usage": null,
    "api_error": "400, message='Bad Request', url='https://api.a4f.co/v1/chat/completions'",
    "status": "failed"
  }
]