{
  "source_run_paths": [
    "cab_implicit/gender/transformed_questions.jsonl"
  ],
  "evaluated_models": [
    {
      "name": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
      "tokenizer_name": null,
      "provider": "together",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 12,
      "args": {
        "temperature": 1.0,
        "max_tokens": 1000
      },
      "system_prompt": "You are a helpful assistant."
    },
    {
      "name": "x-ai/grok-4",
      "tokenizer_name": null,
      "provider": "openrouter",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 12,
      "args": {
        "temperature": 1.0,
        "max_tokens": 1000
      },
      "system_prompt": "You are a helpful assistant."
    },
    {
      "name": "claude-sonnet-4-20250514",
      "tokenizer_name": null,
      "provider": "anthropic",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 12,
      "args": {
        "temperature": 1.0,
        "max_tokens": 1000
      },
      "system_prompt": "You are a helpful assistant."
    },
    {
      "name": "gpt-5-chat-latest",
      "tokenizer_name": null,
      "provider": "openai",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 32,
      "args": {
        "max_output_tokens": 10000
      },
      "system_prompt": "You are a helpful assistant."
    }
  ],
  "persona_path": "profiles/dummy_profiles.jsonl",
  "judge_config": {
    "judge_model": {
      "name": "gpt-5-mini-2025-08-07",
      "tokenizer_name": null,
      "provider": "openai",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 16,
      "args": {
        "max_output_tokens": 10000,
        "reasoning": {
          "effort": "low"
        },
        "text": {
          "verbosity": "low"
        }
      },
      "system_prompt": "You are a helpful assistant"
    },
    "judge_type": "indiv_comparative",
    "judge_attribute": "gender"
  },
  "conversation_settings": {
    "conversation_turn_length": 2,
    "per_turn_assistant_messages": 3,
    "per_turn_user_messages": 1,
    "pairing_strategy": "random"
  },
  "var_attributes": null,
  "evaluation_timestamp": "2025-09-20T22:54:57.892051"
}