
# Launch scripts/run_dpo_multi.py through `accelerate launch` as a single
# process, using the zephyr-7b-beta dpo_multi QLoRA recipe as its config file.
#
# Environment set for this one command only:
#   CUDA_VISIBLE_DEVICES=0      - expose only CUDA device 0 to the process
#   NCCL_P2P_DISABLE=1          - NCCL setting; presumably turns off
#                                 peer-to-peer transport (confirm in NCCL docs)
#   ACCELERATE_LOG_LEVEL=info   - log level passed to accelerate
#
# Everything after the recipe YAML is a command-line override handed to the
# training script (gradient accumulation, beta, temp_alpha, output directory).
CUDA_VISIBLE_DEVICES=0 \
NCCL_P2P_DISABLE=1 \
ACCELERATE_LOG_LEVEL=info \
accelerate launch \
  --config_file recipes/accelerate_configs/multi_gpu.yaml \
  --num_processes=1 \
  --main_process_port=7000 \
  scripts/run_dpo_multi.py \
  recipes/zephyr-7b-beta/dpo_multi/config_qlora.yaml \
  --gradient_accumulation_steps=32 \
  --beta=0.01 \
  --temp_alpha=0.01 \
  --output_dir=formal_data/zephyr-7b-dpo_multi_infoNCE-qlora_example_model