---
# Run configuration: references one benchmark definition file and one
# model definition file by path.
# NOTE(review): both paths are relative; presumably the loader resolves them
# against this file's directory rather than the working directory — confirm.
benchmark: ../benchmarks/nq.yaml
model: ../models/o3mini.yaml