#!/bin/bash
#
# Runs `python3 -m inference_rlhf.code.generate` once for every generation
# index from 0 through 4999. The index is passed to each run as
# `task.generation.generation_idx`; every other key=value override is the
# same for all runs.
#
# Environment:
#   GENERATE_USER  Value passed as the `user=` override. Defaults to
#                  "anonymouspli". Set it to your own user instead of
#                  editing this file.
#
# Exit status:
#   0 if every run succeeded, 1 if at least one run failed. A failed run
#   does not stop the sweep; the remaining indices are still attempted.

readonly FIRST_IDX=0
readonly LAST_IDX=4999
readonly RUN_USER="${GENERATE_USER:-anonymouspli}"

failures=0

# Arithmetic loop: no external `seq` process and no word-splitting involved.
for ((i = FIRST_IDX; i <= LAST_IDX; i++)); do
    # Progress marker on stdout: the index about to be processed.
    printf '%s\n' "$i"

    if ! python3 -m inference_rlhf.code.generate \
        sampling.seed=1337 \
        policy=qwen-25-05b \
        sampling.num_blocks=1 \
        "user=${RUN_USER}" \
        task=math \
        sampling.k=1024 \
        sampling.temperature=1.0 \
        sampling.top_p=1.0 \
        "task.generation.generation_idx=${i}" \
        sampling.tensor_parallel_size=1 \
        generate.remote=True
    then
        # Keep sweeping, but remember the failure so it is not lost among
        # thousands of runs.
        printf 'generation_idx=%s failed\n' "$i" >&2
        failures=$((failures + 1))
    fi
done

if ((failures > 0)); then
    printf '%d of %d runs failed\n' \
        "$failures" "$((LAST_IDX - FIRST_IDX + 1))" >&2
    exit 1
fi

# TODO: replace the `user=` value above with your own before running!
