#!/usr/bin/env bash
#
# Environment setup + training launch for the mistral-7b-base SWEPO (l0) run.
#
# Usage:
#   WANDB_API_KEY=<your key> bash <this script>
#
# Paths below (cache/, accelerate_configs/, scripts/, training_configs/) are
# relative, so the script is expected to be run from the directory that
# contains them — presumably the repository root; verify for your checkout.

# Stop at the first failing step (e.g. a broken pip install) instead of
# launching training in a half-configured environment. Also treat unset
# variables as errors.
set -eu

# Pinned dependency versions.
pip install flash-attn==2.5.7
pip install huggingface-hub==0.24.7

# Authenticate with Weights & Biases. The key is taken from WANDB_API_KEY when
# it is set, so the secret does not have to be written into this file; the
# literal placeholder is kept as a fallback for backward compatibility and
# must be replaced if WANDB_API_KEY is not provided.
wandb login "${WANDB_API_KEY:-Your Id}"

# -p: do not fail when the cache directory already exists (script re-runs).
mkdir -p cache
export HF_HOME="cache"
export WANDB_PROJECT="mpo"

# ACCELERATE_LOG_LEVEL is set for this single command only.
ACCELERATE_LOG_LEVEL=info accelerate launch \
  --config_file accelerate_configs/deepspeed_zero3.yaml \
  scripts/run_swepo.py \
  training_configs/mistral-7b-base-swepo_l0.yaml