# Configuration entry for "Sycophancy Bench": a display name, a slug,
# an admin list, and the model configurations it references.
# NOTE(review): `name` mentions "confidence estimation prompt" while `slug`
# says "best_of_n" — confirm both describe the same variant.
name: "Sycophancy Bench (confidence estimation prompt)"
slug: "sycophancy_best_of_n"
# Presumably the users or groups that administer this entry — verify
# against the consumer's schema.
admins:
  - "sycophancy-1"

# Model configuration identifiers, apparently in "<family>/<model>" form.
# Sequence items are indented to match the style used by `admins`.
model_configs:
  - "qwen/qwen3_4b"
  - "qwen/qwen3_235b_a22b"