{
  "iteration": 0,
  "source_run_path": "cab/gender/samples_gender.jsonl",
  "num_questions_evaluated": 145,
  "num_conversations": 145,
  "evaluated_models": [
    "DeepSeek-V3.1",
    "gpt-oss-120b",
    "Qwen3-235B-A22B-Instruct-2507-tput",
    "x-ai/grok-4"
  ]
}