# Record the runtime environment in the job log before any evaluation runs:
# the available conda environments, the CUDA compiler version, and the
# current GPU status.
conda info --envs
nvcc --version
nvidia-smi

# Disabled run (beavertails responses); uncomment the lines below to re-enable.
# python -m safe_rlhf.evaluate.model_eval \
#     --response_path ../outputdata/generate/beavertails/PPO_Lag_beavertrails_1.json \
#     --reward_model_name_or_path ../model/beaver-7b-v1.0-reward \
#     --cost_model_name_or_path ../model/beaver-7b-v1.0-cost \
#     --output_dir ../outputdata/model_eval/beavertails/

#######################################
# Run safe_rlhf.evaluate.model_eval on the generated responses of one dataset,
# passing the beaver-7b-v1.0 reward and cost model paths.
# All paths are relative to the current working directory.
# Arguments: $1 - dataset directory name (e.g. pku, safety-llama); used for
#                 both the responses input path and the output directory
# Returns:   exit status of the python process
#######################################
run_model_eval() {
  python -m safe_rlhf.evaluate.model_eval \
    --response_path "../outputdata/generate/${1}/Llama-3.2-3B-sft-alpaca-ppo-lag_1.json" \
    --reward_model_name_or_path ../model/beaver-7b-v1.0-reward \
    --cost_model_name_or_path ../model/beaver-7b-v1.0-cost \
    --output_dir "../outputdata/model_eval/${1}/"
}

# Evaluate each dataset in turn. A failing run does not stop the following
# ones, and the status of the last run is what the loop leaves in $?.
for dataset in pku safety-llama; do
  run_model_eval "${dataset}"
done