---
# Run configuration for a generation job over a question-answering dataset.
# NOTE(review): the per-key notes below are inferred from key names and values
# only; confirm them against the script that loads this file.

# Main model identifier.
model_name: 'mistralai/Mistral-7B-v0.1'

# Reward model identifiers (a list; currently a single entry).
# NOTE(review): this is the same checkpoint as model_name; confirm intended.
reward_model_names:
  - 'mistralai/Mistral-7B-v0.1'

# Device assignment per model role.
# NOTE(review): "reward0" presumably refers to reward_model_names[0]; verify.
model_device_map:
  main: 'cuda:0'
  reward0: 'cuda:1'

# Dataset name and the split to read from it.
dataset: 'trivia_qa'

# null here; presumably means "no cap on the number of examples". TODO confirm.
limit: null

# NOTE(review): key is named *_dir but the value is a .jsonl file path.
output_dir: 'outputs/tqa_validation_mistral_v1.jsonl'

# Generation settings.
n_generations: 3
batch_size: 1

split: 'validation'
