#!/usr/bin/env bash
# Create (if needed) and populate the conda environment used to run
# Qwen3-VL with vLLM.
#
# Usage:
#   source <this file>   # leaves the environment activated in your shell
#   bash <this file>     # installs only; activation ends with the script
#
# Optional environment overrides (defaults are the original hard-coded values):
#   QWEN3VL_ENV_PREFIX  directory of the conda environment
#   QWEN3VL_PIP_INDEX   package index URL handed to `pip install -i`
#
# Strict mode (`set -e` etc.) is deliberately NOT enabled: this file may be
# sourced into an interactive shell, where those options would persist after
# it finishes. Every step is checked explicitly instead. The
# `return 1 2>/dev/null || exit 1` idiom stops a sourced run without killing
# the caller's shell, and exits with status 1 when run as a script.

QWEN3VL_ENV_PREFIX=${QWEN3VL_ENV_PREFIX:-/root/user/code_agent/env/qwen3vl}
QWEN3VL_PIP_INDEX=${QWEN3VL_PIP_INDEX:-https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple}

if ! command -v conda >/dev/null 2>&1; then
  printf 'error: conda not found on PATH\n' >&2
  return 1 2>/dev/null || exit 1
fi

# `conda activate` is a shell function that `conda init` normally installs via
# ~/.bashrc; non-interactive shells do not read that file, so load the hook here.
if ! eval "$(conda shell.bash hook)"; then
  printf 'error: failed to initialise the conda shell hook\n' >&2
  return 1 2>/dev/null || exit 1
fi

# Only create the environment when it does not exist yet (a conda environment
# is marked by its conda-meta directory). `-y` skips the interactive prompt;
# guarding the call keeps a re-run from replacing an existing environment.
if [ ! -d "${QWEN3VL_ENV_PREFIX}/conda-meta" ]; then
  if ! conda create -y -p "${QWEN3VL_ENV_PREFIX}" "python=3.12"; then
    printf 'error: conda create failed for %s\n' "${QWEN3VL_ENV_PREFIX}" >&2
    return 1 2>/dev/null || exit 1
  fi
fi

if ! conda activate "${QWEN3VL_ENV_PREFIX}"; then
  printf 'error: could not activate %s\n' "${QWEN3VL_ENV_PREFIX}" >&2
  return 1 2>/dev/null || exit 1
fi

# `python -m pip` ties the install to the interpreter of the activated
# environment rather than to whichever `pip` executable is first on PATH.
if ! python -m pip install -i "${QWEN3VL_PIP_INDEX}" -U vllm; then
  printf 'error: installing vllm failed\n' >&2
  return 1 2>/dev/null || exit 1
fi

if ! python -m pip install -i "${QWEN3VL_PIP_INDEX}" qwen-vl-utils==0.0.14; then
  printf 'error: installing qwen-vl-utils failed\n' >&2
  return 1 2>/dev/null || exit 1
fi

# Example launch command, left commented out; uncomment to start the server
# after the installs above have succeeded.
# vllm serve Qwen/Qwen3-VL-235B-A22B-Instruct \
#   --tensor-parallel-size 8 \
#   --limit-mm-per-prompt.video 0 \
#   --async-scheduling