#!/usr/bin/env bash
# Runs the label_reward*.py scripts on the hhrlhf dataset, once per external
# reward model, always with --bias_type ai.
#
# Required environment:
#   TAMPERING_HOME  root directory that contains
#                   tampering/additional/external_reward_model
#
# Each run is independent: a failure in one model's run does not stop the
# runs that follow it.

# The labelling scripts are invoked by relative name, so a failed cd would make
# every command below run from the wrong directory. Abort instead.
cd "${TAMPERING_HOME:?TAMPERING_HOME must be set}/tampering/additional/external_reward_model" || exit 1

# Expose only CUDA device 0 to the Python processes started below.
export CUDA_VISIBLE_DEVICES=0

# Optional pre-download: hf download Skywork/Skywork-Reward-V2-Llama-3.1-8B
python3 label_reward.py \
  --dataset_name hhrlhf \
  --reward_model "Skywork/Skywork-Reward-V2-Llama-3.1-8B" \
  --model_code skywork-llama \
  --bias_type ai

# Optional pre-download: hf download Skywork/Skywork-Reward-V2-Qwen3-8B
# The reward model must be the Qwen3 checkpoint so that it matches the
# skywork-qwen model code (it previously pointed at the Llama checkpoint).
python3 label_reward.py \
  --dataset_name hhrlhf \
  --reward_model "Skywork/Skywork-Reward-V2-Qwen3-8B" \
  --model_code skywork-qwen \
  --bias_type ai

# Optional pre-download: hf download LxzGordon/URM-LLaMa-3.1-8B
# URM uses its own labelling script.
python3 label_reward_urm.py \
  --dataset_name hhrlhf \
  --reward_model "LxzGordon/URM-LLaMa-3.1-8B" \
  --model_code urm-llama \
  --bias_type ai

# Optional pre-download: hf download Schrieffer/Llama-SARM-4B
python3 label_reward.py \
  --dataset_name hhrlhf \
  --reward_model "Schrieffer/Llama-SARM-4B" \
  --model_code sarm-llama \
  --bias_type ai

# QRM uses its own labelling script and needs flash-attn 2 installed beforehand.
# Unlike the models above, this checkpoint is downloaded explicitly first.
hf download nicolinho/QRM-Gemma-2-27B
python3 label_reward_qrm.py \
  --dataset_name hhrlhf \
  --reward_model "nicolinho/QRM-Gemma-2-27B" \
  --model_code qrm-gemma \
  --bias_type ai