#!/usr/bin/env bash
# Environment and path setup for the evaluation runs in this script:
# activates the conda environment, points DATA at the evaluation parquet file,
# switches into the checkout's old_version/ directory and creates the output
# directory there.

ROOT=/mnt/shared-storage-user/p1-shared/wangfuting/codes/rl/LUFFY
# Alternative checkout location:
# ROOT=/cpfs04/user/wangfuting/rl/LUFFY

# Load conda's shell integration into this (non-interactive) shell so that
# `conda activate` is available, then switch to the evaluation environment.
eval "$(/mnt/shared-storage-user/p1-shared/wangfuting/miniconda3/bin/conda shell.bash hook)"
conda activate verl041 || {
  printf 'error: could not activate conda env %s\n' "verl041" >&2
  exit 1
}

DATA="$ROOT/data/valid.parquet"
# Alternative input file:
# DATA=/fs-computility/prime/wangfuting/rl/LUFFY/data/l1/train_1k_sampled.parquet

# Everything after this point uses paths relative to old_version/ (OUTPUT_DIR,
# eval_scripts/...). Abort if the directory is missing instead of silently
# writing results into the directory the script was launched from.
cd "$ROOT/old_version" || {
  printf 'error: cannot cd to %s\n' "$ROOT/old_version" >&2
  exit 1
}

OUTPUT_DIR=./results_sep/
mkdir -p "$OUTPUT_DIR" || {
  printf 'error: cannot create output directory %s\n' "$OUTPUT_DIR" >&2
  exit 1
}


# ---------------------------------------------------------------------------
# Model under evaluation.
#   MODEL_NAME  label used when naming the output and log files
#   MODEL_PATH  checkpoint directory passed to the generation script
#   TEMPLATE    value passed to the generation script's --template option
# ---------------------------------------------------------------------------
models_root="/mnt/shared-storage-user/p1-shared/wangfuting/shared/models"

TEMPLATE='l1-ours'
MODEL_NAME='grpo-qwen3-8b-deepscaler-ori-length-l1'
MODEL_PATH="${models_root}/verl-041-result/verl-qwen3-8b-new/GRPO-Qwen3-8B-deepscaler-ori-length-l1/global_step_100/actor/huggingface"

# Previously used settings, kept for reference (uncomment a NAME/PATH pair to
# switch the model being evaluated):
# MODEL_NAME=l1-8b-instruct-ours-deepscaler-luffy-style
# MODEL_PATH=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/l1
# MODEL_PATH=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-8b/DAPO-Qwen3-8B-l1-strategy-deepscaler-luffy-style/global_step_200/huggingface
# MODEL_PATH=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-8b/DAPO-Qwen3-8B-Instruct-l1-strategy-deepscaler-luffy-style/global_step_100/actor/huggingface
# MODEL_NAME=l1-ours-deepscaler-luffy-style-add1k
# MODEL_PATH=/mnt/shared-storage-user/p1-shared/wangfuting/shared/models/verl-041-result/verl-qwen3-8b/DAPO-Qwen3-8B-l1-strategy-deepscaler-luffy-style-ori-length/global_step_100/actor/huggingface
# MODEL_NAME=l1-ours-deepscaler-luffy-style-ori-length


# if [ $MODEL_NAME == "eurus-2-7b-prime-zero" ]; then
#   TEMPLATE=prime
# elif [ $MODEL_NAME == "simple-rl-zero" ]; then
#   TEMPLATE=qwen
# else
#   TEMPLATE=own
# fi
# Run eval_scripts/generate_vllm.py once per budget value. For each run the
# --output_file argument is <OUTPUT_DIR>/<MODEL_NAME>_<budget>_test.jsonl and
# the command's stdout is redirected to <OUTPUT_DIR>/<MODEL_NAME>-<budget>.log
# (stderr is left attached to the terminal).
out_dir=${OUTPUT_DIR%/}  # strip one trailing slash so joined paths contain no "//"
failed_budgets=0

for budget in 1024 2048 8192; do
  # Build the argument list as an array so every value stays a single word
  # even if a path ever contains spaces or glob characters.
  gen_args=(
    --model_path "$MODEL_PATH"
    --input_file "$DATA"
    --remove_system True
    --output_file "$out_dir/${MODEL_NAME}_${budget}_test.jsonl"
    --temperature 0.6
    --max_tokens 12288
    --top_p 1.0
    --n 1
    --budget "$budget"
    --template "$TEMPLATE"
  )

  # Keep going with the remaining budgets after a failure, but make the
  # failure visible instead of letting it pass silently.
  if ! CUDA_VISIBLE_DEVICES=0,1,2,3 python eval_scripts/generate_vllm.py \
    "${gen_args[@]}" > "$out_dir/$MODEL_NAME-$budget.log"; then
    printf 'warning: generation failed for budget %s (stdout log: %s)\n' \
      "$budget" "$out_dir/$MODEL_NAME-$budget.log" >&2
    failed_budgets=$((failed_budgets + 1))
  fi
done

# Leave a non-zero status behind when any budget failed, so a caller (or the
# script's own exit status, if this is the last command) reflects it.
[[ "$failed_budgets" -eq 0 ]]