# Print environment diagnostics before any generation run starts: the conda
# environment listing, the nvcc version banner, and the nvidia-smi report.
# Nothing here checks exit statuses, so a missing tool only produces an
# error message and the script carries on.
report_environment() {
    conda info -e
    nvcc -V
    nvidia-smi
}
report_environment

# python -m safe_rlhf.evaluate.generate \
#     --corner_model_name_or_path ../model/Llama-3.2-3B-sft-alpaca \
#     --datasets PKU-SafeRLHF/train \
#     --num_per_prompt 1 \
#     --max_length 512 \
#     --output_dir ../outputdata/generate/test/

# Invoke safe_rlhf.evaluate.generate for the safety-llama/all dataset.
# The checkpoint path and the --output_dir value are held in variables so
# they are easy to spot and edit; every other flag is passed literally.
safety_llama_ckpt=../output/Llama-3.2-3B-sft-alpaca-sacpo
safety_llama_out=../outputdata/generate/safety-llama/
python -m safe_rlhf.evaluate.generate \
    --corner_model_name_or_path "${safety_llama_ckpt}" \
    --datasets safety-llama/all \
    --num_per_prompt 1 \
    --max_length 512 \
    --output_dir "${safety_llama_out}"

# Invoke safe_rlhf.evaluate.generate for the PKU-SafeRLHF/test dataset.
# The checkpoint path and the --output_dir value are held in variables so
# they are easy to spot and edit; every other flag is passed literally.
pku_ckpt=../output/Llama-3.2-3B-sft-alpaca-sacpo
pku_out=../outputdata/generate/pku/
python -m safe_rlhf.evaluate.generate \
    --corner_model_name_or_path "${pku_ckpt}" \
    --datasets PKU-SafeRLHF/test \
    --num_per_prompt 1 \
    --max_length 512 \
    --output_dir "${pku_out}"

# python -m safe_rlhf.evaluate.model_eval \
#     --response_path ../outputdata/generate/pku/Llama-3.2-3B-sft-alpaca_1.json \
#     --reward_model_name_or_path ../model/beaver-7b-v1.0-reward \
#     --cost_model_name_or_path ../model/beaver-7b-v1.0-cost \
#     --output_dir ../outputdata/model_eval/pku/

# python -m safe_rlhf.evaluate.model_eval \
#     --response_path ../outputdata/generate/safety-llama/Llama-3.2-3B-sft-alpaca_1.json \
#     --reward_model_name_or_path ../model/beaver-7b-v1.0-reward \
#     --cost_model_name_or_path ../model/beaver-7b-v1.0-cost \
#     --output_dir ../outputdata/model_eval/safety-llama/

# python -m safe_rlhf.evaluate.generate \
#     --corner_model_name_or_path ../output/RePO_TinyLlama \
#     --datasets safety-llama/all \
#     --num_per_prompt 1 \
#     --max_length 512 \
#     --output_dir ../outputdata/generate/safety-llama/

# python -m safe_rlhf.evaluate.generate \
#     --corner_model_name_or_path ../output/RePO_TinyLlama \
#     --datasets PKU-SafeRLHF/test \
#     --num_per_prompt 1 \
#     --max_length 512 \
#     --output_dir ../outputdata/generate/pku/

# python -m safe_rlhf.evaluate.generate \
#     --corner_model_name_or_path ../output/PPO_Lag_beavertrails \
#     --datasets BeaverTrails/test \
#     --num_per_prompt 1 \
#     --max_length 512 \
#     --output_dir ../outputdata/generate/beavertails/

# python -m safe_rlhf.evaluate.generate \
#     --corner_model_name_or_path ../model/beaver-7b-v1.0 \
#     --datasets safety-llama/all \
#     --num_per_prompt 1 \
#     --max_length 512 \
#     --output_dir ../outputdata/generate/safety-llama/

# python -m safe_rlhf.evaluate.generate \
#     --corner_model_name_or_path ../output/satac_sampletag9_debug_value \
#     --datasets hh-rlhf-harmless-preference/test \
#     --num_per_prompt 1 \
#     --max_length 512 \
#     --output_dir ../outputdata/generate/hh/