
# Runs bon2_compute_logp_for_responses.py over the bo64_t05 validation
# rollouts in two stages:
#   1. the prime-sft-full checkpoint reads the raw rollouts and writes
#      bo64_t05_validation_ref.json (--model-tag reflogp);
#   2. each reward-model checkpoint reads that _ref.json file and writes its
#      own output file (--model-tag rmlogp).
# Every run uses accelerate with 8 processes on GPUs 0-7 and the
# prime-sft-full tokenizer.

# Stage 2 consumes the file stage 1 produces, so stop at the first failure
# instead of launching further 8-GPU jobs against a missing or stale input.
set -euo pipefail

# Plain, unquoted assignments so that `~` is still tilde-expanded by the shell.
VERL_ROOT=~/verl_250713
MODEL_ROOT=~/LLaMA-Factory-250514/saves_shuyan/llama3.2-1B-base
readonly VERL_ROOT MODEL_ROOT

readonly SFT_DIR="${MODEL_ROOT}/prime-sft-full"
readonly ROLLOUT_STEM="${SFT_DIR}/prime-rl-rollouts/bo64_t05_validation"
readonly REF_JSON="${ROLLOUT_STEM}_ref.json"

#######################################
# Launch one run of bon2_compute_logp_for_responses.py through accelerate.
# Globals:   VERL_ROOT (read), SFT_DIR (read; always used as tokenizer path)
# Arguments: $1 - model checkpoint directory (--model-path)
#            $2 - input JSON file (--input-json)
#            $3 - output JSON file (--output-path)
#            $4 - value passed to --model-tag
# Returns:   exit status of the accelerate command
#######################################
run_logp() {
  local model_dir=$1
  local input_json=$2
  local output_json=$3
  local model_tag=$4

  CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 \
    "${VERL_ROOT}/.conda/bin/accelerate" launch \
    --num_processes 8 "${VERL_ROOT}/scripts/bon2_compute_logp_for_responses.py" \
    --model-path "${model_dir}" \
    --tokenizer-path "${SFT_DIR}" \
    --input-json "${input_json}" \
    --output-path "${output_json}" \
    --batch-size 8 \
    --model-tag "${model_tag}"
}

# Stage 1: SFT checkpoint over the raw rollouts.
run_logp "${SFT_DIR}" "${ROLLOUT_STEM}.json" "${REF_JSON}" reflogp

# Guard against a run that exits 0 without producing the intermediate file.
if [[ ! -e "${REF_JSON}" ]]; then
  printf 'error: expected stage-1 output not found: %s\n' "${REF_JSON}" >&2
  exit 1
fi

# Stage 2: one run per reward-model checkpoint.
# Entry format: "<checkpoint dir name>:<output file suffix>".
# NOTE(review): the original script listed implicit-prm twice with identical
# arguments and the same output path; it is listed once here. If the second
# entry was meant to be a different checkpoint, add it to this table.
reward_models=(
  "dpo_rm:dpo"
  "implicit-drm-beta10-gamma5:implicit-drm-beta10-gamma5"
  "implicit-prm:implicit-prm"
)

for entry in "${reward_models[@]}"; do
  model_name=${entry%%:*}
  out_suffix=${entry#*:}
  run_logp "${MODEL_ROOT}/${model_name}" "${REF_JSON}" \
    "${ROLLOUT_STEM}_${out_suffix}.json" rmlogp
done
  
  
# bash ~/verl_250713/scripts/run_250926.sh