# Score one fixed set of validation rollouts with several reward models, for
# two policy families (llama3.2-1B-base and qwen3-0.6B-base).
#
# Per family, five 8-process `accelerate launch` runs of
# bon2_compute_logp_for_responses_1.py are made:
#   1.   the family's SFT checkpoint reads the shared rollouts file and writes
#        validation_0_2048_rewrite_ref.json          (--model-tag reflogp)
#   2-5. implicit-prm, implicit-drm-beta10-gamma5, qrm1/<checkpoint> and
#        dpo_rm each read that *_ref.json and write their own output file
#                                                    (--model-tag rmlogp)
#
# Runs 2-5 consume the file written by run 1, so they are skipped for a family
# whose run 1 fails. Runs 2-5 do not depend on each other; a failure in one
# does not stop the rest. The status of the last command below is non-zero if
# any run failed.

# Unquoted on purpose: `~` is only expanded in an unquoted assignment.
accelerate_bin=~/verl_250713/.conda/bin/accelerate
scorer_script=~/verl_250713/scripts/bon2_compute_logp_for_responses_1.py
saves_root=~/LLaMA-Factory-250514/saves_shuyan

# Both families score the same rollouts file (it lives under llama3.2-3B).
rollouts_jsonl="$saves_root/llama3.2-3B/prime-sft/prime-rl-rollouts/validation_0_2048_rewrite.jsonl"

#######################################
# Launch the scorer once on 8 processes / GPUs 0-7.
# Globals:   accelerate_bin, scorer_script (read)
# Arguments: $1 - model path
#            $2 - tokenizer path
#            $3 - input JSON/JSONL file
#            $4 - output path
#            $5 - batch size
#            $6 - model tag (reflogp | rmlogp)
#            $7.. - extra scorer flags, placed just before --model-tag
# Returns:   exit status of `accelerate launch`
#######################################
run_scorer() {
  local model_path="$1"
  local tokenizer_path="$2"
  local input_json="$3"
  local output_path="$4"
  local batch_size="$5"
  local model_tag="$6"
  shift 6

  CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 \
    "$accelerate_bin" launch \
    --num_processes 8 "$scorer_script" \
    --model-path "$model_path" \
    --tokenizer-path "$tokenizer_path" \
    --input-json "$input_json" \
    --output-path "$output_path" \
    --batch-size "$batch_size" \
    "$@" \
    --model-tag "$model_tag"
}

#######################################
# Run the reference pass and the four reward-model passes for one family.
# Globals:   saves_root, rollouts_jsonl (read)
# Arguments: $1 - family directory under saves_root (e.g. llama3.2-1B-base)
#            $2 - SFT checkpoint directory name; also used as the tokenizer
#            $3 - batch size for the implicit-prm pass
#            $4 - qrm1 checkpoint directory name (e.g. checkpoint-100)
# Outputs:   diagnostics on stderr
# Returns:   0 if every pass succeeded, 1 otherwise
#######################################
score_family() {
  local family_dir="$saves_root/$1"
  local sft_dir="$family_dir/$2"
  local prm_batch="$3"
  local qrm_checkpoint="$4"
  local out_dir="$sft_dir/prime-rl-rollouts"
  local out_prefix="$out_dir/validation_0_2048_rewrite"
  local ref_json="${out_prefix}_ref.json"
  local rc=0

  # Fail before spinning up 8 processes if the input is not there.
  if [ ! -f "$rollouts_jsonl" ]; then
    printf 'score_family %s: rollouts file not found: %s\n' \
      "$1" "$rollouts_jsonl" >&2
    return 1
  fi

  # The output directory is not the directory the rollouts live in, so it may
  # not exist yet. Harmless if the scorer would create it as well.
  mkdir -p -- "$out_dir" || return 1

  # Reference log-probs. Everything below reads $ref_json, so stop here on
  # failure instead of scoring against a missing or stale file.
  if ! run_scorer "$sft_dir" "$sft_dir" "$rollouts_jsonl" "$ref_json" \
    8 reflogp; then
    printf 'score_family %s: reference pass failed; skipping reward models\n' \
      "$1" >&2
    return 1
  fi

  # implicit-prm: batch size differs per family (see the calls at the bottom).
  run_scorer "$family_dir/implicit-prm" "$sft_dir" "$ref_json" \
    "${out_prefix}_implicitprm.json" "$prm_batch" rmlogp || rc=1

  run_scorer "$family_dir/implicit-drm-beta10-gamma5" "$sft_dir" "$ref_json" \
    "${out_prefix}_ipvrm.json" 8 rmlogp || rc=1

  # NOTE(review): `--model_type` uses an underscore while every other scorer
  # flag uses hyphens. Kept verbatim; confirm it matches the scorer's parser.
  run_scorer "$family_dir/qrm1/$qrm_checkpoint" "$sft_dir" "$ref_json" \
    "${out_prefix}_qrm.json" 2 rmlogp --model_type rm3 || rc=1

  run_scorer "$family_dir/dpo_rm" "$sft_dir" "$ref_json" \
    "${out_prefix}_dpo.json" 8 rmlogp || rc=1

  return "$rc"
}

#######################################
# Score both families; a failure in one family does not prevent the other.
# Returns: 0 if every pass of every family succeeded, 1 otherwise
#######################################
score_all_families() {
  local rc=0
  #            family            SFT dir         prm batch  qrm checkpoint
  score_family llama3.2-1B-base  prime-sft-full  8          checkpoint-100 || rc=1
  score_family qwen3-0.6B-base   prime-sft       2          checkpoint-600 || rc=1
  return "$rc"
}

score_all_families