{
  "source_run_paths": [
    "cab/gender/samples_gender.jsonl"
  ],
  "evaluated_models": [
    {
      "name": "deepseek-ai/DeepSeek-V3.1",
      "tokenizer_name": null,
      "provider": "together",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 12,
      "args": {
        "temperature": 1.0,
        "max_tokens": 1000,
        "chat_template_kwargs": {
          "thinking": false
        }
      },
      "system_prompt": "You are a helpful assistant."
    },
    {
      "name": "openai/gpt-oss-120b",
      "tokenizer_name": null,
      "provider": "together",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 12,
      "args": {
        "temperature": 1.0,
        "max_tokens": 1000,
        "reasoning_effort": "low"
      },
      "system_prompt": "You are a helpful assistant."
    },
    {
      "name": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
      "tokenizer_name": null,
      "provider": "together",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 12,
      "args": {
        "temperature": 1.0,
        "max_tokens": 1000
      },
      "system_prompt": "You are a helpful assistant."
    },
    {
      "name": "x-ai/grok-4",
      "tokenizer_name": null,
      "provider": "openrouter",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 12,
      "args": {
        "temperature": 1.0,
        "max_tokens": 1000
      },
      "system_prompt": "You are a helpful assistant."
    }
  ],
  "persona_path": "profiles/dummy_profiles.jsonl",
  "judge_config": {
    "judge_model": {
      "name": "gpt-5-mini-2025-08-07",
      "tokenizer_name": null,
      "provider": "openai",
      "dtype": "float16",
      "device": "auto",
      "max_workers": 16,
      "args": {
        "max_output_tokens": 10000,
        "reasoning": {
          "effort": "low"
        },
        "text": {
          "verbosity": "low"
        }
      },
      "system_prompt": "You are a helpful assistant"
    },
    "judge_type": "indiv_comparative",
    "judge_attribute": "gender"
  },
  "conversation_settings": {
    "conversation_turn_length": 2,
    "per_turn_assistant_messages": 3,
    "per_turn_user_messages": 1,
    "pairing_strategy": "random"
  },
  "var_attributes": null,
  "evaluation_timestamp": "2025-09-20T11:13:04.453829"
}