#!/bin/bash
# Run the inference_rlhf.code.generate module once per generation index,
# from first_idx through last_idx inclusive.
#
# Every index is attempted even when an earlier invocation fails. Indices
# whose invocation returned a non-zero status are collected, reported on
# stderr, and cause the script to exit with status 1 once the loop is done,
# so a partially failed sweep is detectable by the caller.
first_idx=0
last_idx=377
failed_indices=()

for ((i = first_idx; i <= last_idx; i++)); do
    # Progress marker on stdout: the index about to be processed.
    printf '%s\n' "$i"
    if ! python3 -m inference_rlhf.code.generate \
        sampling.seed=1337 \
        policy=qwen-25-05b \
        sampling.num_blocks=1 \
        user=anonymouspli \
        task=mbpp \
        sampling.k=1024 \
        sampling.temperature=1.0 \
        sampling.top_p=1.0 \
        task.generation.generation_idx="$i" \
        sampling.tensor_parallel_size=1 \
        generate.remote=True; then
        # Keep going so one bad index does not block the remaining ones,
        # but remember it for the summary below.
        printf 'generation failed for index %s\n' "$i" >&2
        failed_indices+=("$i")
    fi
done

if ((${#failed_indices[@]} > 0)); then
    printf '%d generation run(s) failed; indices: %s\n' \
        "${#failed_indices[@]}" "${failed_indices[*]}" >&2
    exit 1
fi

# TODO: replace the `user=` value in the command above with your own username before running.

# Debug variant: a single invocation (generation_idx=0) with a smaller sampling.k=10.
# python3 -m inference_rlhf.code.generate \
#         sampling.seed=1337 \
#         policy=qwen-25-05b \
#         sampling.num_blocks=1 \
#         user=anonymouspli \
#         task=mbpp \
#         sampling.k=10 \
#         sampling.temperature=1.0 \
#         sampling.top_p=1.0 \
#         task.generation.generation_idx=0 \
#         sampling.tensor_parallel_size=1 \
#         generate.remote=True
