# Flat settings file: every key below is a single top-level YAML key whose name
# happens to contain dots (YAML does not turn "a.b" into a nested mapping).
# Keys are grouped by prefix: trainer, data, model, rollout.
# NOTE(review): YAML itself does not expand $HOME or $MODEL_NAME; whatever
# loads this file must substitute them — confirm against the launcher.

# Trainer: node count and GPUs per node.
trainer.nnodes: 1
trainer.n_gpus_per_node: 2

# Data: input parquet file, the key that holds the prompt, and the output file.
data.path: $HOME/data/math-hard/test.parquet
data.prompt_key: prompt
# NOTE(review): slice_start / crop_size presumably select a window of the
# input (start offset and length) — confirm against the data loader.
data.slice_start: 128
data.crop_size: 128
data.batch_size: 128
# NOTE(review): presumably the number of generations sampled per prompt —
# confirm against the consumer.
data.n_samples: 256
data.output_path: "/beegfs/scratch/user/<anonymized>/reasoning/generations/$MODEL_NAME.more_problems.parquet"

# Model: local checkpoint directory selected through $MODEL_NAME.
model.path: "/beegfs/scratch/user/<anonymized>/reasoning/huggingface/$MODEL_NAME"
# Alternative model.path values, currently disabled:
# model.path: meta-llama/Llama-3.2-3B-Instruct
# model.path: Qwen/Qwen2.5-1.5B-Instruct

# Rollout: sampling parameters.
# NOTE(review): top_k: -1 presumably means "no top-k truncation" in the
# inference engine — confirm against the engine's documentation.
rollout.temperature: 1
rollout.top_p: 1
rollout.top_k: -1
# Rollout: prompt and response length settings (units presumably tokens —
# TODO confirm).
rollout.prompt_length: 1800
rollout.response_length: 1024
# Rollout: engine parallelism and memory settings.
rollout.tensor_model_parallel_size: 1
rollout.gpu_memory_utilization: 0.9
# NOTE(review): this line originally carried a trailing "#65536" comment,
# presumably an earlier value kept for reference — confirm.
rollout.max_num_batched_tokens: 98304
# NOTE(review): the value is quoted, so a YAML parser yields the string "true"
# rather than a boolean — confirm the consumer expects a string here.
rollout.calculate_log_probs: "true"