#!/bin/bash

# Load conda environment
source /data/user/miniconda3/etc/profile.d/conda.sh
conda activate rllm2
cd /data/user/rllm

# Load env vars (HF token, etc.)
set -a
. /data/user/rllm/.env
set +a

set -x

# Print GPU info
srun -l bash -c 'echo "Node: $(hostname -s)"; nvidia-smi -L'
set -euo pipefail
set -euo pipefail

echo "This script has been superseded by:"
echo "  scripts/train/bugs/eval/bugs/run_eval_bigcodebench_bugfixer_all_in_one.sh"
echo "Please use the all-in-one script going forward."
exit 2

# Orchestrate:
#   1) launch base vLLM server
#   2) wait until base is ready
#   3) launch fix vLLM server
#   4) wait until fix is ready
#   5) run examples/bugs/eval_bigcodebench_bugfixer.py
#   6) cleanup both servers on exit
#
# Assumptions:
# - You have a python env with `vllm`, `datasets`, and this repo on PYTHONPATH (or run from repo root).
# - vLLM provides an OpenAI-compatible endpoint at http://HOST:PORT/v1
#
# Config via env (safe defaults):
#   BASE_MODEL_PATH, BASE_SERVED_MODEL_NAME, BASE_HOST, BASE_PORT, BASE_TP, BASE_CUDA_VISIBLE_DEVICES
#   FIX_MODEL_PATH,  FIX_SERVED_MODEL_NAME,  FIX_HOST,  FIX_PORT,  FIX_TP,  FIX_CUDA_VISIBLE_DEVICES
#   HF_DATASET, HF_SPLIT, START, MAX_EXAMPLES, OUTPUT_JSONL
#   BASE_TEMPERATURE, BASE_TOP_P, BASE_MAX_TOKENS
#   FIX_TEMPERATURE, FIX_TOP_P, FIX_MAX_TOKENS
#
# Example:
#   BASE_MODEL_PATH=Qwen/Qwen2.5-Coder-7B-Instruct BASE_CUDA_VISIBLE_DEVICES=0 BASE_PORT=30000 \
#   FIX_MODEL_PATH=/path/to/bugfixer FIX_CUDA_VISIBLE_DEVICES=1 FIX_PORT=30001 \
#   ./scripts/train/bugs/eval/bugs/run_eval_bigcodebench_bugfixer_two_vllm.sh

RLLM_DIR="${RLLM_DIR:-/data/user/rllm}"
cd "$RLLM_DIR"

# Optional: load env vars (HF token, etc.)
if [[ -f "$RLLM_DIR/.env" ]]; then
  set -a
  . "$RLLM_DIR/.env"
  set +a
fi

BASE_HOST="${BASE_HOST:-127.0.0.1}"
BASE_PORT="${BASE_PORT:-30000}"
FIX_HOST="${FIX_HOST:-127.0.0.1}"
FIX_PORT="${FIX_PORT:-30001}"

BASE_OPENAI_URL="http://${BASE_HOST}:${BASE_PORT}/v1"
FIX_OPENAI_URL="http://${FIX_HOST}:${FIX_PORT}/v1"

HF_DATASET="${HF_DATASET:-anonymous/bigcodebench}"
HF_SPLIT="${HF_SPLIT:-v0.1.0_hf}"
START="${START:-0}"
MAX_EXAMPLES="${MAX_EXAMPLES:-200}"
OUTPUT_JSONL="${OUTPUT_JSONL:-}"

BASE_TEMPERATURE="${BASE_TEMPERATURE:-0.2}"
BASE_TOP_P="${BASE_TOP_P:-0.95}"
BASE_MAX_TOKENS="${BASE_MAX_TOKENS:-2048}"

FIX_TEMPERATURE="${FIX_TEMPERATURE:-0.6}"
FIX_TOP_P="${FIX_TOP_P:-0.95}"
FIX_MAX_TOKENS="${FIX_MAX_TOKENS:-2048}"

LOG_DIR="${LOG_DIR:-$RLLM_DIR/runs/eval_bigcodebench_bugfixer}"
mkdir -p "$LOG_DIR"

BASE_LOG="${BASE_LOG:-$LOG_DIR/base_vllm_${BASE_PORT}.log}"
FIX_LOG="${FIX_LOG:-$LOG_DIR/fix_vllm_${FIX_PORT}.log}"
EVAL_LOG="${EVAL_LOG:-$LOG_DIR/eval.log}"

wait_for_server() {
  local url="$1"
  local name="$2"
  local timeout_s="${3:-600}"
  local start_ts
  start_ts="$(date +%s)"
  echo "[wait] Waiting for $name at ${url}/models (timeout=${timeout_s}s)"
  while true; do
    if curl -fsS "${url}/models" >/dev/null 2>&1; then
      echo "[wait] $name is up."
      return 0
    fi
    local now_ts
    now_ts="$(date +%s)"
    if (( now_ts - start_ts > timeout_s )); then
      echo "[wait] ERROR: timed out waiting for $name at ${url}/models" >&2
      return 1
    fi
    sleep 2
  done
}

cleanup() {
  set +e
  echo "[cleanup] Stopping servers..."
  if [[ -n "${FIX_PID:-}" ]]; then kill "$FIX_PID" 2>/dev/null || true; fi
  if [[ -n "${BASE_PID:-}" ]]; then kill "$BASE_PID" 2>/dev/null || true; fi
  sleep 2
  if [[ -n "${FIX_PID:-}" ]]; then kill -9 "$FIX_PID" 2>/dev/null || true; fi
  if [[ -n "${BASE_PID:-}" ]]; then kill -9 "$BASE_PID" 2>/dev/null || true; fi
}
trap cleanup EXIT INT TERM

echo "[run] Launch base server first..."
(
  export BASE_HOST="$BASE_HOST"
  export BASE_PORT="$BASE_PORT"
  # The remaining BASE_* vars can be set by caller; defaults in serve script.
  exec bash "$RLLM_DIR/scripts/train/bugs/eval/bugs/serve_vllm_base.sh"
) >"$BASE_LOG" 2>&1 &
BASE_PID=$!
echo "[run] base pid=$BASE_PID log=$BASE_LOG"
wait_for_server "$BASE_OPENAI_URL" "base"

echo "[run] Launch fix server second..."
(
  export FIX_HOST="$FIX_HOST"
  export FIX_PORT="$FIX_PORT"
  # The remaining FIX_* vars can be set by caller; defaults in serve script.
  exec bash "$RLLM_DIR/scripts/train/bugs/eval/bugs/serve_vllm_fix.sh"
) >"$FIX_LOG" 2>&1 &
FIX_PID=$!
echo "[run] fix pid=$FIX_PID log=$FIX_LOG"
wait_for_server "$FIX_OPENAI_URL" "fix"

# Served model names default to model paths in the serve scripts.
BASE_SERVED_MODEL_NAME="${BASE_SERVED_MODEL_NAME:-${BASE_MODEL_PATH:-Qwen/Qwen2.5-Coder-7B-Instruct}}"
FIX_SERVED_MODEL_NAME="${FIX_SERVED_MODEL_NAME:-${FIX_MODEL_PATH:-Qwen/Qwen2.5-Coder-7B-Instruct}}"

echo "[run] Running eval..."
set -x

EVAL_CMD=(python "$RLLM_DIR/examples/bugs/eval_bigcodebench_bugfixer.py"
  --hf_dataset "$HF_DATASET"
  --hf_split "$HF_SPLIT"
  --start "$START"
  --max_examples "$MAX_EXAMPLES"
  --base_model "$BASE_SERVED_MODEL_NAME"
  --base_model_url "$BASE_OPENAI_URL"
  --base_temperature "$BASE_TEMPERATURE"
  --base_top_p "$BASE_TOP_P"
  --base_max_tokens "$BASE_MAX_TOKENS"
  --fix_model "$FIX_SERVED_MODEL_NAME"
  --fix_model_url "$FIX_OPENAI_URL"
  --fix_temperature "$FIX_TEMPERATURE"
  --fix_top_p "$FIX_TOP_P"
  --fix_max_tokens "$FIX_MAX_TOKENS"
)

if [[ -n "$OUTPUT_JSONL" ]]; then
  EVAL_CMD+=(--output_jsonl "$OUTPUT_JSONL")
fi

"${EVAL_CMD[@]}" 2>&1 | tee "$EVAL_LOG"

set +x
echo "[run] Done. Logs:"
echo "  base: $BASE_LOG"
echo "  fix : $FIX_LOG"
echo "  eval: $EVAL_LOG"


