
# --- Environment and service setup for the inference runs in this script ---

# Make CUDA devices 0 through 7 visible to every process launched from here.
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
export CUDA_VISIBLE_DEVICES

# Override HOME with the project's src directory for all child processes.
HOME="/home/export/base/ycsc_1/1/online1//GRM-Omni/src"
export HOME

# Restart Ray: force-stop any running instance and, only when that succeeds,
# bring up a fresh head node with usage stats disabled and 24 CPUs.
if ray stop --force; then
  ray start --head --disable-usage-stats --num-cpus=24
fi

# Model locations. These are plain shell variables (not exported); the
# src/inference.py invocations in this script read them as
# --inference_model, --refinement_model and --score_model respectively.
INF_MODEL="/data//GRM-Omni-ckpt/GRM-Omni-Lang-SFT"
REFINE_MODEL="/data//hf_models/models/Qwen3-32B-AWQ"
SCORE_MODEL="/data//hf_models/models/Skywork-Reward-V2-Llama-3.1-8B"

# Reference paths to RewardBench language inputs (chat_hard and reasoning splits):
# /home/export/base/ycsc_1/1/online1//GRM-Omni/data/testset/benchmark/language/rewardbench/chat_hard.jsonl
# /home/export/base/ycsc_1/1/online1//GRM-Omni/data/testset/benchmark/language/rewardbench/reasoning.jsonl

# python src/inference.py \
#     --inference_model $INF_MODEL \
#     --refinement_model $REFINE_MODEL \
#     --score_model $SCORE_MODEL \
#     --modality "language" \
#     --mode "criteria_meta_reward" \
#     --sampling_n 1 \
#     --batch_size 2 \
#     --workers 8 \
#     --input_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/testset/benchmark/language/rewardbench/reasoning.jsonl" \
#     --output_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/trainset/language/criteria/reasoning/"

# python src/inference.py \
#     --inference_model $INF_MODEL \
#     --refinement_model $REFINE_MODEL \
#     --score_model $SCORE_MODEL \
#     --modality "language" \
#     --mode "criteria_meta_reward" \
#     --sampling_n 1 \
#     --batch_size 2 \
#     --workers 8 \
#     --input_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/testset/benchmark/language/rewardbench/chat.jsonl" \
#     --output_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/trainset/language/criteria/chat/"

# python src/inference.py \
#     --inference_model $INF_MODEL \
#     --refinement_model $REFINE_MODEL \
#     --score_model $SCORE_MODEL \
#     --modality "language" \
#     --mode "criteria_meta_reward" \
#     --sampling_n 1 \
#     --batch_size 128 \
#     --workers 8 \
#     --input_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/testset/benchmark/language/rewardbench/chat_hard.jsonl" \
#     --output_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/trainset/language/criteria/chat_hard/"

# python src/inference.py \
#     --inference_model $INF_MODEL \
#     --refinement_model $REFINE_MODEL \
#     --score_model $SCORE_MODEL \
#     --modality "language" \
#     --mode "criteria_meta_reward" \
#     --sampling_n 1 \
#     --batch_size 128 \
#     --workers 8 \
#     --input_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/testset/benchmark/language/rewardbench/safety.jsonl" \
#     --output_dir "/home/export/base/ycsc_1/1/online1//GRM-Omni/data/trainset/language/criteria/safety/"
