#!/usr/bin/env bash
# Runs eval_rewarded_soups.py via `accelerate launch` on GPUs 0-3, passing two
# checkpoint directories, the reward names, and the experiment type.

# Checkpoint directories forwarded as --base_model_path1 / --base_model_path2.
base_model_path1=./logs_morlhf/rlhf_harmless/batch_400
# base_model_path2=./logs_morlhf/rlhf_humor/batch_400
base_model_path2=./logs_morlhf/rlhf_helpful/batch_832
# Comma-separated reward names; also reused below as the wandb run name.
# NOTE(review): presumably the order must match path1/path2 — confirm against
# eval_rewarded_soups.py.
reward_names="harmless,helpful"
# Experiment type; forwarded as --exp_type and embedded in the save directory.
exp_type=assistant

# All expansions are quoted so values containing whitespace or glob characters
# reach the Python script as single, unmodified arguments.
CUDA_VISIBLE_DEVICES=0,1,2,3 accelerate launch --main_process_port 29505 \
  eval_rewarded_soups.py \
  --base_model_path1 "${base_model_path1}" \
  --base_model_path2 "${base_model_path2}" \
  --reward_names "${reward_names}" \
  --exp_type "${exp_type}" \
  --wandb_name "${reward_names}" \
  --save_directory "./logs_rewardedsoups_${exp_type}_eval"