
if [ -z "$1" ]; then
  echo "Usage: $0 <file_id>"
  echo "Example: $0 0"
  exit 1
fi

INPUT_PATH=$1
OUTPUT_PATH=$2
STUDENT_IP=$3

export HF_HUB_CACHE=/xxx
export HF_HUB_OFFLINE=1
export VLLM_USE_MODELSCOPE=0
export VLLM_USE_HARMONY=0
export TIKTOKEN_RS_CACHE_DIR=hf_hub/o200k_base_tokeinzer


MODEL_PATH_GPT_OSS="openai/gpt-oss-120b"
HOST="0.0.0.0"
PORT_GPT_OSS=23333
TP=8
GPU_MEM_UTILIZATION_GPT_OSS=0.8
MAX_MODEL_LEN=45000
MODEL_NAME_GPT_OSS="gpt-oss"

LOCAL_IP=$(hostname -I | awk '{for(i=1;i<=NF;i++){if($i ~ /^10\./ || $i ~ /^192\./){print $i; exit}}}')
if [ -z "$LOCAL_IP" ]; then
  LOCAL_IP="localhost"
fi


LOG_FILE_GPT_OSS="logs/vllm_gpt_oss_file_${FILE_ID}.log"
nohup python -m vllm.entrypoints.openai.api_server \
    --model "$MODEL_PATH_GPT_OSS" \
    --tensor-parallel-size "$TP" \
    --host "$HOST" \
    --port "$PORT_GPT_OSS" \
    --max-model-len "$MAX_MODEL_LEN" \
    --gpu-memory-utilization "$GPU_MEM_UTILIZATION_GPT_OSS" \
    --served-model-name "$MODEL_NAME_GPT_OSS" \
    --trust-remote-code > "$LOG_FILE_GPT_OSS" 2>&1 &

python run_tessy.py \
  --input_path "$INPUT_PATH" \
  --output_path "$OUTPUT_PATH" \
  --teacher_api_url http://127.0.0.1:${PORT_GPT_OSS}/v1/completions \
  --student_api_url "$STUDENT_IP" \
  --batch_size 40 \
  --teacher_classifier_path checkpoints/teacher_label/32B_judge_oss_think/ \
  --student_classifier_path checkpoints/teacher_label/32B_judge_8B_think/ \
  --teacher_step_size 20 \
  --student_step_size 20 \
  --retry True

