#!/bin/bash
# Deploy SGLang server in background

set -e

SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
cd "$SCRIPT_DIR"

# Default values (empty = use defaults from deploy_attacker.sh)
MODEL_PATH=""
SERVER_NODE=""
SERVER_PORT=""
WAIT_FOR_READY=true

# Parse command line arguments
while [[ $# -gt 0 ]]; do
    case $1 in
        -m|--model)
            MODEL_PATH="$2"
            shift 2
            ;;
        --server-node)
            SERVER_NODE="$2"
            shift 2
            ;;
        --server-port)
            SERVER_PORT="$2"
            shift 2
            ;;
        --no-wait)
            WAIT_FOR_READY=false
            shift
            ;;
        *)
            echo "Unknown option: $1"
            echo "Usage: $0 [OPTIONS]"
            echo "  -m, --model MODEL_PATH    Model path (default: from deploy_attacker.sh)"
            echo "  --server-node NODE        Server node for URL/checks (default: localhost)"
            echo "  --server-port PORT        Server port for URL/checks (default: 30000)"
            echo "  --no-wait                 Don't wait for server to be ready"
            exit 1
            ;;
    esac
done

# Set defaults for URL construction and checks (must be concrete even if we let deploy_attacker.sh decide)
CHECK_NODE="${SERVER_NODE:-localhost}"
CHECK_PORT="${SERVER_PORT:-30000}"  # should match deploy_attacker.sh default

# Set server URL
SERVER_URL="http://${CHECK_NODE}:${CHECK_PORT}"

# Create logs directory
mkdir -p logs

# Check if server is already running
if curl -s "$SERVER_URL/health" > /dev/null 2>&1; then
    echo "✓ SGLang server is already running on $CHECK_NODE:$CHECK_PORT"
    echo "  Server is ready and accessible"
    # Get PID if on localhost
    if [ "$CHECK_NODE" = "localhost" ] || [ "$CHECK_NODE" = "127.0.0.1" ]; then
        SERVER_PID=$(pgrep -f "sglang.launch_server.*${CHECK_PORT}" | head -1 || echo "")
        if [ -n "$SERVER_PID" ]; then
            echo "  PID: $SERVER_PID"
        fi
    fi
    echo ""
    echo "To check server status:"
    echo "  curl $SERVER_URL/health"
    echo ""
    echo "To view logs:"
    echo "  tail -f logs/sglang_server.log"
    exit 0
fi

# Check HF_HOME
if [ -z "$HF_HOME" ]; then
    echo "Error: HF_HOME environment variable is not set"
    echo "Please set it before running this script:"
    echo "  export HF_HOME=\$SCRATCH/LLMs"
    exit 1
fi

# Check if conda is available
if ! command -v conda &> /dev/null; then
    echo "Error: conda is not available"
    exit 1
fi

# Initialize conda
eval "$(conda shell.bash hook)"

# Only start server if on localhost
if [ "$CHECK_NODE" != "localhost" ] && [ "$CHECK_NODE" != "127.0.0.1" ]; then
    echo "⚠️  Remote server node specified ($CHECK_NODE)"
    echo "  Skipping local server start. Will only check if server is running."
    if curl -s "$SERVER_URL/health" > /dev/null 2>&1; then
        echo "✓ Remote server is running and accessible"
        exit 0
    else
        echo "❌ Remote server is not accessible at $SERVER_URL"
        exit 1
    fi
fi

echo "Starting SGLang server in background"
if [ -n "$MODEL_PATH" ]; then
    echo "  Model: $MODEL_PATH"
else
    echo "  Model: (default from deploy_attacker.sh)"
fi
echo "  Server node: $CHECK_NODE"
echo "  Server URL: $SERVER_URL"
echo "  Logs will be written to: logs/sglang_server.log"
echo ""

# Stop any existing server processes
pkill -f "sglang.launch_server.*${CHECK_PORT}" 2>/dev/null || true
sleep 2

# Run in background with nohup.
# Note: deploy_attacker.sh initializes conda itself, so we can call it directly and safely pass args (including spaces).
DEPLOY_ARGS=()
if [ -n "$MODEL_PATH" ]; then
    DEPLOY_ARGS+=(--model "$MODEL_PATH")
fi
if [ -n "$SERVER_PORT" ]; then
    DEPLOY_ARGS+=(--port "$SERVER_PORT")
fi

nohup bash deploy_attacker.sh "${DEPLOY_ARGS[@]}" > logs/sglang_server.log 2>&1 &
SERVER_PID=$!

echo "✓ Server process started with PID: $SERVER_PID"
echo ""

# Wait for server to be ready if requested
if [ "$WAIT_FOR_READY" = true ]; then
    echo "Waiting for server to initialize (this may take several minutes)..."
    echo "Press Ctrl+C to cancel and check logs manually"
    echo ""
    
    # Wait for server to start - loop until ready (no timeout)
    WAITED=0
    SERVER_READY=false
    
    while true; do
        # Check if process is still running
        if ! ps -p $SERVER_PID > /dev/null 2>&1; then
            echo ""
            echo "❌ Server process died! Check logs:"
            echo "  tail -20 logs/sglang_server.log"
            exit 1
        fi
        
        # Check if server is responding to health checks
        if curl -s "$SERVER_URL/health" > /dev/null 2>&1; then
            # Double check with a more detailed request
            HEALTH_RESPONSE=$(curl -s "$SERVER_URL/health" 2>&1)
            if [ $? -eq 0 ]; then
                echo ""
                echo "✓ Server is ready and responding! (waited ${WAITED}s)"
                SERVER_READY=true
                break
            fi
        fi
        
        # Show progress every 10 seconds
        if [ $((WAITED % 10)) -eq 0 ] && [ $WAITED -gt 0 ]; then
            echo -n " (${WAITED}s)"
        else
            echo -n "."
        fi
        
        sleep 2
        WAITED=$((WAITED + 2))
    done
    echo ""
    
    # Final verification - test with a simple API call
    echo "Performing final server verification..."
    sleep 2
    if curl -s "$SERVER_URL/health" > /dev/null 2>&1; then
        echo "✓ Server verification successful"
    else
        echo "⚠️  Server verification failed, but continuing..."
    fi
    echo ""
else
    echo "Skipping wait (--no-wait flag set)"
    echo "  Server is starting in background. Check status with:"
    echo "    curl $SERVER_URL/health"
    echo ""
fi

echo "Server information:"
echo "  PID: $SERVER_PID"
echo "  URL: $SERVER_URL"
echo ""
echo "To check server status:"
echo "  curl $SERVER_URL/health"
echo ""
echo "To view logs:"
echo "  tail -f logs/sglang_server.log"
echo ""
echo "To stop server:"
echo "  kill $SERVER_PID"
echo "  # or: pkill -f sglang.launch_server"

