
# Fan out contrastive_decoding.py over the validation parquet.
#
# Two expert checkpoints (seq_ce_11_self, every_position_ce_11_self2) are each
# run against the same base model on four --begin/--end ranges
# (0-210, 210-420, 420-630, 630-842). Every range is its own background
# process pinned to a GPU through CUDA_VISIBLE_DEVICES and writes its own
# JSONL file inside the expert checkpoint directory.
#
# Unlike a bare "cmd &" list, this script blocks until every shard has
# finished and ends with a non-zero status if any shard failed, so callers
# (schedulers, nohup wrappers, follow-up merge steps) can rely on it.
#
# Kept POSIX-sh compatible on purpose (no arrays, no `local`) because the file
# has no shebang and may be started with either `sh` or `bash`.

set -u

PYTHON_BIN="${HOME}/verl_250713/.conda/bin/python"
DECODE_SCRIPT="${HOME}/verl_250713/scripts/contrastive_decoding.py"
SAVES_DIR="${HOME}/LLaMA-Factory-250514/saves/qwen3-0.6B"
BASE_MODEL="${SAVES_DIR}/prime-sft-new"
# The directory name below is spelled exactly as it exists on disk.
VALID_DATA="${BASE_MODEL}/PRIME-RL-qwen3sft-0-480000-not-exceeed-catagory5/valid.parquet"

# Space-separated PIDs of the launched shard jobs, consumed by the barrier at
# the bottom of the script.
shard_pids=""

#######################################
# Start one decoding shard in the background and remember its PID.
# Globals:
#   PYTHON_BIN, DECODE_SCRIPT, SAVES_DIR, BASE_MODEL, VALID_DATA (read)
#   shard_pids (appended)
# Arguments:
#   $1 - value for CUDA_VISIBLE_DEVICES
#   $2 - expert checkpoint directory name under SAVES_DIR
#   $3 - value passed as --begin
#   $4 - value passed as --end
#        (presumably row indices into the parquet; confirm the exact
#        inclusive/exclusive semantics against contrastive_decoding.py)
# Outputs:
#   The job writes
#   SAVES_DIR/<expert>/math-test-contrastive_decoding_<begin>_<end>.jsonl
#######################################
launch_shard() {
  # --score_threshhold_value is spelled the way the original invocation passes
  # it to the Python script; do not "correct" it here without changing the
  # script's argument parser as well.
  CUDA_VISIBLE_DEVICES="$1" "${PYTHON_BIN}" "${DECODE_SCRIPT}" \
    --expert_model "${SAVES_DIR}/$2" \
    --base_model "${BASE_MODEL}" \
    --data "${VALID_DATA}" \
    --prompt_key prompt \
    --output_key response \
    --begin "$3" --end "$4" \
    --output_jsonl "${SAVES_DIR}/$2/math-test-contrastive_decoding_${3}_${4}.jsonl" \
    --batch_size 8 \
    --candidate_threshold 0.2 \
    --score_threshhold_value 0.2 &
  shard_pids="${shard_pids} $!"
}

#            GPU  expert checkpoint            begin  end
# NOTE(review): the first two shards share GPU 0 while GPU 1 is never used.
# The original mapping is preserved here; if that was a copy-paste slip,
# change the GPU of the second call to 1.
launch_shard 0 seq_ce_11_self 0 210
launch_shard 0 seq_ce_11_self 210 420
launch_shard 2 seq_ce_11_self 420 630
launch_shard 3 seq_ce_11_self 630 842

launch_shard 4 every_position_ce_11_self2 0 210
launch_shard 5 every_position_ce_11_self2 210 420
launch_shard 6 every_position_ce_11_self2 420 630
launch_shard 7 every_position_ce_11_self2 630 842

# Barrier: wait on each PID individually so that a failure in any shard is
# noticed (a bare `wait` with no operands always returns 0).
failed_shards=0
# shellcheck disable=SC2086 # word splitting of the PID list is intended
for shard_pid in ${shard_pids}; do
  if ! wait "${shard_pid}"; then
    printf 'contrastive decoding shard (pid %s) failed\n' "${shard_pid}" >&2
    failed_shards=$((failed_shards + 1))
  fi
done

# Leave the failure state as the status of the last command instead of calling
# `exit`, so the file stays safe to source or to extend with later steps.
[ "${failed_shards}" -eq 0 ]
    
    