

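# Disabled multi-GPU variant (kept for reference): starts one server per GPU
# index i in the background, on port 8000+i, logging to api_gpu<i>.log.
# NUM_GPUS=8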
# for (( i=0; i<NUM_GPUS; i++ )); do
#     LOG_FILE="api_gpu${i}.log"
#     echo "Starting server on port $((8000+i)) with GPU: $i"
#     CUDA_VISIBLE_DEVICES=$i python -m sglang.launch_server \
#         --model-path /home/export/base/ycsc_1/1/online1/hf_models/Skywork-Reward-V2-Llama-3.1-8B \
#         --mem-fraction-static 0.9 \
#         --tp 1 \
#         --host 127.0.0.1 \
#         --port $((8000+i)) \
#         --context-length 16384 \
#         --is-embedding \
#         > $LOG_FILE 2>&1 &
# done

# Start one sglang server in the foreground for the model stored at
# $reward_model_dir, listening on $listen_host:$listen_port.
# Output is not redirected, so server logs go to this shell's stdout/stderr.
reward_model_dir=/home/export/base/ycsc_1/1/online1/hf_models/Skywork-Reward-V2-Llama-3.1-8B
listen_host=127.0.0.1
listen_port=8000
static_mem_fraction=0.9
max_context_len=16384

# CUDA_VISIBLE_DEVICES is assigned as a command prefix, so it applies to this
# python process only and is not exported to anything that runs afterwards.
# NOTE(review): --tp is presumably the tensor-parallel size and --is-embedding
# presumably serves the model through the embedding path; confirm against the
# sglang server-argument docs.
CUDA_VISIBLE_DEVICES=0 python -m sglang.launch_server \
    --model-path "$reward_model_dir" \
    --mem-fraction-static "$static_mem_fraction" \
    --tp 1 \
    --host "$listen_host" \
    --port "$listen_port" \
    --context-length "$max_context_len" \
    --is-embedding