# conda create -n dpo2 python=3.10 && conda activate dpo2

#### version 1 #####
# pip install torch==2.2.2 torchvision==0.17.2 torchaudio==2.2.2 --index-url https://download.pytorch.org/whl/cu121
# pip install -U amlt --index-url https://msrpypi.azurewebsites.net/stable/leloojoo

# git clone https://github.com/huggingface/alignment-handbook.git
# cd ./alignment-handbook/
# python -m pip install .
# cd ..
# rm -rf ./alignment-handbook
# pip uninstall alignment-handbook

# pip install wandb trl==0.9.6 huggingface-hub==0.24.7 peft==0.7.1 transformers==4.45.2

# python -m pip install flash-attn --no-build-isolation

#### version 2 #####
# Environment setup: torch 2.5.1 (cu121 wheel index) + vLLM 0.7.1, the
# dependencies pulled in by alignment-handbook, a prebuilt flash-attn wheel,
# and local clones of the model repositories under ./huggingface/.
#
# Directory changes are confined to subshells or avoided entirely, so a failed
# step can never leave later commands running in an unexpected directory.
# `set -e` is intentionally not used: this file may be sourced or pasted into
# an interactive shell, where it would terminate the session on any error.

# Core framework stack, pinned.
pip install torch==2.5.1 torchvision==0.20.1 torchaudio==2.5.1 --index-url https://download.pytorch.org/whl/cu121
pip install vllm==0.7.1
# NOTE(review): `pathlib` is part of the Python 3 standard library; the PyPI
# package of that name is probably unnecessary here -- confirm before removing.
pip install trl==0.9.6 huggingface-hub==0.24.7 peft==0.7.1 transformers==4.45.2 pathlib

# alignment-handbook is installed and then uninstalled again, which leaves only
# the dependencies that its installation pulled in.
git clone https://github.com/huggingface/alignment-handbook.git
# Subshell: if the clone failed, the failed `cd` skips the install and the
# caller's working directory is left untouched.
(cd ./alignment-handbook/ && python -m pip install .)
rm -rf ./alignment-handbook
# -y: do not stop at pip's interactive confirmation prompt.
pip uninstall -y alignment-handbook

# Prebuilt flash-attn wheel (tagged cu12 / torch2.5 / cp310 / linux_x86_64).
flash_attn_wheel='flash_attn-2.7.4.post1+cu12torch2.5cxx11abiFALSE-cp310-cp310-linux_x86_64.whl'
# -O pins the output name, so a stale copy is overwritten rather than the new
# download being saved as "<name>.1" and the stale file installed instead.
wget -O "./${flash_attn_wheel}" \
  "https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/${flash_attn_wheel}" \
  && pip install "./${flash_attn_wheel}"
# Clean up regardless of outcome (wget -O leaves an empty file on failure).
rm -f -- "./${flash_attn_wheel}"
unset flash_attn_wheel

# Model repositories. Explicit target paths reproduce the original layout
# (./huggingface/<repo> and ./huggingface/princeton-nlp/<repo>) without
# depending on a chain of unchecked `cd` calls; -p makes re-runs safe.
mkdir -p ./huggingface/princeton-nlp
git lfs install
git clone https://huggingface.co/RLHFlow/ArmoRM-Llama3-8B-v0.1 ./huggingface/ArmoRM-Llama3-8B-v0.1
git clone https://huggingface.co/lzc0525/llama3-3b-ultrafeedback ./huggingface/princeton-nlp/llama3-3b-ultrafeedback
git clone https://huggingface.co/lzc0525/llama3-math ./huggingface/princeton-nlp/llama3-math

# NOTE(review): hard-coded location, presumably the project checkout -- confirm.
cd ~/dpo/
# Re-apply the pins last, in case an earlier install changed these versions.
pip install trl==0.9.6 huggingface-hub==0.24.7 peft==0.7.1 transformers==4.45.2 # be sure
