# Compute layout for the job, as named by the keys: number of nodes and
# GPUs per node. With these values the job spans 1 x 2 = 2 GPUs.
trainer.nnodes: 1
trainer.n_gpus_per_node: 2
# Input dataset and output location.
# NOTE: YAML itself does not expand $HOME or $MODEL_NAME; whatever loads this
# file (or a shell wrapper around it) has to substitute them — TODO confirm
# where that happens.
data.path: $HOME/data/gsm8k/test.parquet
# Name of the field that holds the prompt (presumably a column of the parquet
# file above — verify against the loader).
data.prompt_key: prompt
# NOTE(review): the meaning of crop_size cannot be determined from this file —
# confirm against the consumer before changing it.
data.crop_size: 128
data.batch_size: 128
# Presumably the number of generations sampled per prompt — TODO confirm.
data.n_samples: 256
# NOTE(review): the file name is derived from $MODEL_NAME, which is not set in
# the visible part of this file, while model.path is hard-coded. Make sure the
# two agree, otherwise generations are stored under another model's name.
data.output_path: "/beegfs/scratch/user/<anonymized>/reasoning/generations/$MODEL_NAME.parquet"
# Model to generate with. Keep exactly one model.path line active: a second
# uncommented model.path would be a duplicate key (most YAML parsers silently
# keep the last one). The commented lines are alternatives: a local checkpoint
# directory named after $MODEL_NAME, and another hub-style model id.
# model.path: "/beegfs/scratch/user/<anonymized>/reasoning/huggingface/$MODEL_NAME"
# model.path: meta-llama/Llama-3.2-3B-Instruct
model.path: Qwen/Qwen2.5-1.5B-Instruct
# Sampling settings. temperature 1 and top_p 1 leave the distribution
# unscaled and untruncated; in vLLM-style samplers top_k = -1 disables top-k
# filtering (assumes a vLLM-compatible rollout backend — TODO confirm).
rollout.temperature: 1
rollout.top_p: 1
rollout.top_k: -1
# Token lengths for prompt and response (presumably upper bounds — verify).
# Together they give 512 + 512 = 1024 tokens per sequence.
rollout.prompt_length: 512
rollout.response_length: 512
# Presumably 1 means no tensor parallelism, i.e. each model replica lives on a
# single GPU — confirm against the rollout backend.
rollout.tensor_model_parallel_size: 1
# Presumably the fraction of GPU memory the inference engine may reserve;
# 0.95 would leave little headroom for anything else on the device — confirm.
rollout.gpu_memory_utilization: 0.95
# 98304 = 96 * (512 + 512); the alternative 65536 = 64 * (512 + 512).
rollout.max_num_batched_tokens: 98304  # alternative: 65536