#!/usr/bin/env bash
# Installs this checkout in editable mode (with the "torch" and "metrics"
# extras) and DeepSpeed, then the rest of the script runs inference.
#
# Abort on the first failing command or unset variable, so a broken install
# does not go on to launch the GPU job.
set -eu

# Use `python -m pip` so the packages are installed into the same interpreter
# that the `python` command later in this script runs; bare `pip`/`pip3` can
# resolve to a different Python installation.
python -m pip install -e ".[torch,metrics]" --no-build-isolation
python -m pip install deepspeed

# Environment switches inherited by every command started after this point.
# NOTE(review): presumably these turn off Weights & Biases and SwanLab
# experiment tracking and skip a dependency version check — confirm against
# the tools that read them.
WANDB_DISABLED="true"
SWANLAB_MODE="disabled"
DISABLE_VERSION_CHECK=1
export WANDB_DISABLED SWANLAB_MODE DISABLE_VERSION_CHECK


# Run scripts/vllm_infer_selfies.py on the chembl_desc2mol_test dataset using
# the qwen template.
#
# CUDA device IDs are zero-based, so 0-7 exposes exactly eight GPUs; an ID of
# 8 would name a ninth device.
# NOTE(review): assumes an eight-GPU node — adjust the list to the host.
# NOTE(review): `xxxx` (model path) and `xxxxx.json` (output name) look like
# placeholders — replace them before running.
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python scripts/vllm_infer_selfies.py \
    --model_name_or_path xxxx \
    --template qwen \
    --dataset chembl_desc2mol_test \
    --save_name xxxxx.json \
    --batch_size 512 \
    --max_new_tokens 2048 \
    --preprocessing_num_workers 8