# Pairs one benchmark definition with one model definition.
# Both values are relative paths to other YAML files.
# NOTE(review): the base directory these paths resolve against is decided by
# the loader, which is not visible here — presumably this file's own directory;
# confirm.

# Benchmark definition file to use.
benchmark: ../benchmarks/cbb.yaml

# Model definition file to use.
model: ../models/phi4reasoning.yaml