export OPENAI_AZURE_ENDPOINT= # azure openai endpoint
export OPENAI_API_KEY= # azure openai key
export OPENAI_API_VERSION= # azure openai version
export PROCESSOR=gpt-4o-mini 


# Check and parse command-line arguments
if [ "$#" -ne 6 ]; then
    echo "Usage: $0 <model_path> <gpu_id> <vllm_port> <accelerate_main_port> <output_suffix> <current_path>"
    exit 1
fi

MODEL="$1"
GPU_ID="$2"
LOCAL_PORT="$3"
ACCELERATE_MAIN_PORT="$4"
OUTPUT_SUFFIX="$5"
CURRENT_PATH="$6"

GPU_MEMORY_UTILIZATION=${GPU_MEMORY_UTILIZATION:-0.85}
VLLM_HEALTH_CHECK_URL="http://localhost:${LOCAL_PORT}/health"
VLLM_READINESS_TIMEOUT=180
SLEEP_AFTER_RUN=5 # Sleep before cleaning up vLLM

# --- Global Variables ---
vllm_pid="" # Variable to store the PID of the vLLM background process

# --- Cleanup Function ---
# This function is called automatically on script exit, interrupt (Ctrl+C), or termination signal
cleanup() {
    echo "Cleaning up vLLM process (PID: $vllm_pid)..."
    if [ -n "$vllm_pid" ]; then # Check if PID variable is not empty
        # Check if the process with this PID is still running
        if ps -p $vllm_pid > /dev/null; then
            echo "Attempting graceful shutdown (SIGTERM) for PID $vllm_pid..."
            # Send SIGTERM first to allow for graceful shutdown
            kill -TERM "$vllm_pid"
            # Wait a few seconds for it to shut down
            sleep 5
            # Check again if the process is still running
            if ps -p $vllm_pid > /dev/null; then
                echo "Process $vllm_pid did not shut down gracefully. Sending SIGKILL..."
                # Send SIGKILL as a last resort
                kill -KILL "$vllm_pid"
            else
                echo "Process $vllm_pid shut down gracefully."
            fi
        else
            echo "vLLM process $vllm_pid is not running (already stopped?)."
        fi
        vllm_pid="" # Clear PID after attempting cleanup
    else
        echo "No vLLM process PID recorded for cleanup."
    fi
}

# --- Trap Setup ---
trap cleanup EXIT INT TERM

echo "[Run ${OUTPUT_SUFFIX}] Starting script for model: ${MODEL}"
echo "[Run ${OUTPUT_SUFFIX}] Using GPU: ${GPU_ID}, vLLM Port: ${LOCAL_PORT}, Accelerate Port: ${ACCELERATE_MAIN_PORT}"

# --- Start vLLM Server ---
echo "[Run ${OUTPUT_SUFFIX}] Starting vLLM server..."

# Set CUDA_VISIBLE_DEVICES for THIS script's execution environment
export CUDA_VISIBLE_DEVICES="$GPU_ID"

# Run vLLM in the background using '&' and capture its PID ($!)
python -m vllm.entrypoints.openai.api_server \
    --model "${MODEL}" \
    --trust-remote-code \
    --dtype=bfloat16 \
    --port="${LOCAL_PORT}" \
    --gpu-memory-utilization="${GPU_MEMORY_UTILIZATION}" \
    --seed 63 &


# Capture the PID of the background process
vllm_pid=$!

# Check if the background process command was successfully initiated
# Note: This only checks if 'python ... &' started, not if vLLM itself succeeded.
# The health check covers the actual vLLM startup success.
if [ $? -ne 0 ]; then
    echo "Error: Failed to initiate the vLLM background process."
    vllm_pid="" # Ensure cleanup doesn't run with a potentially invalid PID
    exit 1
fi

echo "[Run ${OUTPUT_SUFFIX}] vLLM process started with PID: $vllm_pid"
echo "[Run ${OUTPUT_SUFFIX}] Waiting for vLLM server to become ready at $VLLM_HEALTH_CHECK_URL (timeout: ${VLLM_READINESS_TIMEOUT}s)..."

# --- Wait for vLLM Readiness ---
start_time=$(date +%s)
while true; do
    # Check if the vLLM process is still running
    if ! ps -p "$vllm_pid" > /dev/null; then
        echo "[Run ${OUTPUT_SUFFIX}] Error: vLLM process (PID $vllm_pid) died unexpectedly during startup."
        exit 1 # Trap will handle cleanup
    fi

    # Use curl to check the health endpoint
    if curl -sf -o /dev/null "$VLLM_HEALTH_CHECK_URL"; then
        echo "[Run ${OUTPUT_SUFFIX}] vLLM server is ready."
        break
    fi

    # Check for timeout
    current_time=$(date +%s)
    elapsed_time=$((current_time - start_time))
    if [ "$elapsed_time" -ge "$VLLM_READINESS_TIMEOUT" ]; then
        echo "[Run ${OUTPUT_SUFFIX}] Error: vLLM server did not become ready within $VLLM_READINESS_TIMEOUT seconds."
        exit 1 # Trap will handle cleanup
    fi

    sleep 5
done

# --- Run the Interaction Program ---
echo "[Run ${OUTPUT_SUFFIX}] vLLM is ready. Starting sample_and_adapter_train.py..."


# aime24
accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/aime24/major_voting" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --temperature 0.7 \
    --top_p 0.9 \
    --self-consistency \
    --rollout-num 10 \
    --task aime24 &
pid1=$!

accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/aime24/greedy" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool  \
    --task aime24 &
pid2=$!

wait $pid1 $pid2
echo "aime24 finish"

# aime25
accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/aime25/major_voting" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --temperature 0.7 \
    --top_p 0.9 \
    --self-consistency \
    --rollout-num 10 \
    --task aime25 &
pid1=$!

accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/aime25/greedy" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --task aime25 &
pid2=$!

wait $pid1 $pid2
echo "aime25 finish"

# minerva_math
accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/minerva_math/major_voting" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --temperature 0.7 \
    --top_p 0.9 \
    --self-consistency \
    --rollout-num 10 \
    --task minerva_math &
pid1=$!

accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/minerva_math/greedy" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --task minerva_math &
pid2=$!

wait $pid1 $pid2
echo "minerva_math finish"

# openai_math
accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/openai_math/major_voting" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --temperature 0.7 \
    --top_p 0.9 \
    --self-consistency \
    --rollout-num 10  \
    --task openai_math &
pid1=$!

accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/openai_math/greedy" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool  \
    --task openai_math &
pid2=$!

wait $pid1 $pid2
echo "openai_math finish"

# olympiad_bench
accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/olympiad_bench/major_voting" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --temperature 0.7 \
    --top_p 0.9 \
    --self-consistency \
    --rollout-num 10 \
    --task olympiad_bench & 
pid1=$!

accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/olympiad_bench/greedy" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --threadpool \
    --task olympiad_bench &
pid2=$!

wait $pid1 $pid2
echo "olympiad_bench finish"

# s1k_eval
accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/s1k_eval/major_voting" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --real_test \
    --threadpool \
    --temperature 0.7 \
    --top_p 0.9 \
    --self-consistency \
    --rollout-num 10  \
    --task s1k_eval & 
pid1=$!

accelerate launch --mixed_precision fp16 \
    --main_process_port "${ACCELERATE_MAIN_PORT}" sample_and_adapter_train.py \
    --config configs_qwen/S1kBenchmark_eval.yaml \
    --search_weight 0.0 \
    --debug "${CURRENT_PATH}/benchmark/s1k_eval/greedy" \
    --seed=63 \
    --port ${LOCAL_PORT} \
    --whitebox ${MODEL} \
    --real_test \
    --threadpool  \
    --task s1k_eval &
pid2=$!

wait $pid1
exit_code1=$?
echo "major voting finish"

wait $pid2
exit_code2=$?
echo "greedy finish"

if [ $exit_code1 -ne 0 ] || [ $exit_code2 -ne 0 ]; then
    echo "[Run ${OUTPUT_SUFFIX}] sample_and_adapter_train.py exited with error."
    overall_exit_code=1 
else
    echo "[Run ${OUTPUT_SUFFIX}] sample_and_adapter_train.py finished successfully."
    overall_exit_code=0
fi
# --- Post-Run Sleep ---
echo "[Run ${OUTPUT_SUFFIX}] sample_and_adapter_train.py finished. Sleeping for $SLEEP_AFTER_RUN seconds before cleanup..."
sleep $SLEEP_AFTER_RUN

# --- Script Exit ---
# The trap handles the final cleanup upon script exit.
echo "[Run ${OUTPUT_SUFFIX}] Script finished. Exiting with code $overall_exit_code."
exit $overall_exit_code