#!/bin/bash
#
# Launch an SGLang server for the Llama-3.3-Nemotron-70B reward model,
# sharded across 8 GPUs and listening on port 30000.
#
# Usage: run from the directory the relative MODEL_PATH below is meant to be
# resolved against.
# NOTE(review): the path is relative to the current working directory, not to
# this script's location -- confirm the intended launch directory.
set -euo pipefail

readonly MODEL_PATH="../../../../models/models--nvidia--Llama-3.3-Nemotron-70B-Reward-Multilingual"

# Expose GPUs 0-7 to the server; the count matches the --tp value below.
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

# Build the command line as an array so every argument stays a single word,
# even if the model path ever contains whitespace or glob characters.
server_args=(
  --model-path "$MODEL_PATH"
  --tp 8
  --dtype bfloat16
  --port 30000
  # Presumably clients send pre-tokenized input -- verify against callers.
  --skip-tokenizer-init
  --trust-remote-code
)

# exec replaces this shell with the server process so signals from a
# supervisor reach the server directly and its exit status is ours.
exec python3 -m sglang.launch_server "${server_args[@]}"
