#!/usr/bin/env bash
# Launch sft.py through torchrun, starting one local worker process for each
# GPU id listed in gpu_ids.
set -euo pipefail

# GPU ids exposed to the job via CUDA_VISIBLE_DEVICES. The worker count passed
# to torchrun is derived from this list, so the two values cannot drift apart
# when the list is edited.
readonly gpu_ids="0,1,2,3"
export CUDA_VISIBLE_DEVICES="${gpu_ids}"

# Split the comma-separated id list and count its entries.
IFS=',' read -r -a gpu_list <<< "${gpu_ids}"
readonly nproc="${#gpu_list[@]}"

# Arguments forwarded verbatim to sft.py. Keeping them in an array avoids
# backslash line continuations; a trailing one would silently absorb whatever
# line is added after the command.
train_args=(
  --model_name "xxxx" # NOTE(review): looks like a placeholder -- confirm before running
  --batch_size 8
  --gradient_accumulation_steps 8
  --dataset Books
  --prompt_path "prompt/book.txt"
  --learning_rate 1e-5
  --num_train_epochs 2
  --eval_step 0.5
  --cutoff_len 1024
)

torchrun --nproc_per_node "${nproc}" --master_port=22642 sft.py "${train_args[@]}"