#!/usr/bin/env bash
set -euo pipefail

# 选择测试哪些子集
# 1 代表执行，0 代表不执行
RUN_AIS=0
RUN_FIT=0

RUN_PMR=1
RUN_PMR_ROLLBACK=1





USER_IP_POOL_LIST=(
    "33.18.242.62",
    "33.32.6.100",
    "33.32.54.108",
    "33.32.28.89"
)

USER_MODEL_NAME="${USER_MODEL_NAME:-}"
USER_BASE_URL="${USER_BASE_URL:-}"


# 选择 user 是否走计费端口
# USER_MODEL_NAME="DeepSeek-V3.2-Meituan"
# USER_BASE_URL="https://basicaiservice.sankuai.com/basicai/v1"

OPEN_SOURCE_REQUESTS_PER_IP=2
CLOSED_SOURCE_REQUESTS_PER_IP=1



# 自己训的模型 ===================================================================
# OPEN_SOURCE=1
# AGENT_THINKING=0

# AGENT_MODEL_NAME="qwen2514_toucan_119k" AGENT_IP="33.32.0.125"
# AGENT_MODEL_NAME="qwen2532_toucan_119k" AGENT_IP="33.32.37.62"

# AGENT_MODEL_NAME="qwen2514_toucan_119k_travel_3k" AGENT_IP="33.32.33.2"
# AGENT_MODEL_NAME="qwen2532_toucan_119k_travel_3k" AGENT_IP="33.32.20.118"

# AGENT_MODEL_NAME="qwen2514_toucan_119k_travel_3k_mt_ctr_rd_mi_220" AGENT_IP="33.18.251.9"
# AGENT_MODEL_NAME="qwen2532_toucan_119k_travel_3k_mt_ctr_rd_mi_220" AGENT_IP="33.32.16.13"


# AGENT_MODEL_NAME="qwen2514_toucan_119k_travel_3k_mt_ctr_rd_220" AGENT_IP="33.18.236.35"

# AGENT_MODEL_NAME="qwen2514_toucan_119k_travel_3k_mt_ctr_220" AGENT_IP="33.32.49.120"

# AGENT_MODEL_NAME="qwen2514_toucan_119k_travel_3k_mt_220" AGENT_IP="33.32.15.25"

# AGENT_MODEL_NAME="qwen2514_toucan_119k_travel_3k_st_140" AGENT_IP="33.32.25.65"


# 开源 think ===================================================================
# OPEN_SOURCE=1
# AGENT_THINKING=1

# st
# AGENT_MODEL_NAME="deepseek-v32" AGENT_IP="33.32.1.86" USER_IP_POOL_LIST=("33.32.1.86")

# AGENT_MODEL_NAME="deepseek-v32" AGENT_IP="33.32.39.59" USER_IP_POOL_LIST=("33.32.39.59")


# AGENT_MODEL_NAME="qwen3-235b-think"  AGENT_IP="33.32.40.143"  # 记得调整 max_token 为 32k


# 开源 nothink ===================================================================
OPEN_SOURCE=1
AGENT_THINKING=0

AGENT_MODEL_NAME="deepseek-v32" AGENT_IP="33.18.232.8" USER_IP_POOL_LIST=("33.18.232.8")
# AGENT_MODEL_NAME="deepseek-v32" AGENT_IP="33.18.237.127" USER_IP_POOL_LIST=("33.18.237.127")


# AGENT_MODEL_NAME="qwen2514"  AGENT_IP="10.166.152.109"
# AGENT_MODEL_NAME="qwen2532"  AGENT_IP="10.164.53.74"

# AGENT_MODEL_NAME="deepseek-v32"  AGENT_IP="33.18.235.12"

# AGENT_MODEL_NAME="qwen3-235b-instruct" AGENT_IP="33.18.241.27"  # 记得调整 max_token 为 32k

# AGENT_MODEL_NAME="qwen2.5-32b-instruct" AGENT_IP="33.253.132.106" # 记得调整 max_token 为 32k

# AGENT_MODEL_NAME="qwen3-32b" AGENT_IP="33.32.40.143"  # 记得调整 max_token 为 32k



# 闭源 think ===================================================================
# OPEN_SOURCE=0
# AGENT_THINKING=1
# AGENT_IP="0.1.2.3"

# AGENT_MODEL_NAME="LongCat-Flash-Thinking-2601"
# AGENT_MODEL_NAME="glm-4.7"
# AGENT_MODEL_NAME="gemini-3-flash-preview"
# AGENT_MODEL_NAME="gemini-3-pro-preview"
# AGENT_MODEL_NAME="aws.claude-sonnet-4.5"
# AGENT_MODEL_NAME="kimi-k2-thinking"


# 闭源 nothink ===================================================================
# OPEN_SOURCE=0
# AGENT_THINKING=0
# AGENT_IP="0.1.2.3"

# AGENT_MODEL_NAME="glm-4.7"
# AGENT_MODEL_NAME="kimi-k2-0905-preview"







if [ "$OPEN_SOURCE" -eq 1 ]; then
    AGENT_BASE_URL="http://$AGENT_IP:8000/v1"
else
    AGENT_BASE_URL="https://basicaiservice.sankuai.com/basicai/v1"
fi



if [ "$OPEN_SOURCE" -eq 1 ]; then
    REQUESTS_PER_IP="$OPEN_SOURCE_REQUESTS_PER_IP"
else
    REQUESTS_PER_IP="$CLOSED_SOURCE_REQUESTS_PER_IP"
fi

if [ "$AGENT_THINKING" -eq 1 ]; then
    TASK_ID="${AGENT_MODEL_NAME}-think-hard"
else
    TASK_ID="${AGENT_MODEL_NAME}-nothink-hard"
fi

AGENT_MAX_TOKENS=""
case "$AGENT_MODEL_NAME" in
    qwen2514_toucan_119k|qwen2532_toucan_119k|qwen2514_toucan_119k_travel_3k|qwen2532_toucan_119k_travel_3k)
        AGENT_MAX_TOKENS=$((32 * 1024))
        ;;
    qwen*|gemini*)
        AGENT_MAX_TOKENS=$((32 * 1024))
        ;;
esac

SCRIPT_DIR="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd -P)"
WORKSPACE_DIR="$(cd -- "$SCRIPT_DIR/../.." && pwd -P)"

LOG_DIR="$WORKSPACE_DIR/ttv2_eval_1/log"
mkdir -p "$LOG_DIR"

AIS_LOG="$LOG_DIR/${TASK_ID}_AIS.log"
FIT_LOG="$LOG_DIR/${TASK_ID}_FIT.log"
PMR_LOG="$LOG_DIR/${TASK_ID}_PMR.log"
PMR_ROLLBACK_LOG="$LOG_DIR/${TASK_ID}_PMR_ROLLBACK.log"

USER_IP_POOL="$(IFS=,; echo "${USER_IP_POOL_LIST[*]}")"

if [ "$RUN_AIS" -eq 1 ]; then
  USER_IP_POOL="$USER_IP_POOL" \
  USER_MODEL_NAME="$USER_MODEL_NAME" \
  USER_BASE_URL="$USER_BASE_URL" \
  AGENT_MODEL_NAME="$AGENT_MODEL_NAME" \
  AGENT_IP="$AGENT_IP" \
  AGENT_BASE_URL="$AGENT_BASE_URL" \
  OPEN_SOURCE="$OPEN_SOURCE" \
  REQUESTS_PER_IP="$REQUESTS_PER_IP" \
  AGENT_THINKING="$AGENT_THINKING" \
  AGENT_MAX_TOKENS="$AGENT_MAX_TOKENS" \
  TESTS="$TESTS_AIS" \
  nohup python3 -u "$SCRIPT_DIR/hard_AIS.py" --task_id "$TASK_ID" >"$AIS_LOG" 2>&1 &
  AIS_PID="$!"
  echo "hard_AIS pid=$AIS_PID log=$AIS_LOG"
fi

if [ "$RUN_FIT" -eq 1 ]; then
  USER_IP_POOL="$USER_IP_POOL" \
  USER_MODEL_NAME="$USER_MODEL_NAME" \
  USER_BASE_URL="$USER_BASE_URL" \
  AGENT_MODEL_NAME="$AGENT_MODEL_NAME" \
  AGENT_IP="$AGENT_IP" \
  AGENT_BASE_URL="$AGENT_BASE_URL" \
  OPEN_SOURCE="$OPEN_SOURCE" \
  REQUESTS_PER_IP="$REQUESTS_PER_IP" \
  AGENT_THINKING="$AGENT_THINKING" \
  AGENT_MAX_TOKENS="$AGENT_MAX_TOKENS" \
  TESTS="$TESTS_FIT" \
  nohup python3 -u "$SCRIPT_DIR/hard_FIT_no_issue.py" --task_id "$TASK_ID" >"$FIT_LOG" 2>&1 &
  FIT_PID="$!"
  echo "hard_FIT pid=$FIT_PID log=$FIT_LOG"
fi

if [ "$RUN_PMR" -eq 1 ]; then
  USER_IP_POOL="$USER_IP_POOL" \
  USER_MODEL_NAME="$USER_MODEL_NAME" \
  USER_BASE_URL="$USER_BASE_URL" \
  AGENT_MODEL_NAME="$AGENT_MODEL_NAME" \
  AGENT_IP="$AGENT_IP" \
  AGENT_BASE_URL="$AGENT_BASE_URL" \
  OPEN_SOURCE="$OPEN_SOURCE" \
  REQUESTS_PER_IP="$REQUESTS_PER_IP" \
  AGENT_THINKING="$AGENT_THINKING" \
  AGENT_MAX_TOKENS="$AGENT_MAX_TOKENS" \
  TESTS="$TESTS_PMR" \
  nohup python3 -u "$SCRIPT_DIR/hard_PMR_no_issue.py" --task_id "$TASK_ID" >"$PMR_LOG" 2>&1 &
  PMR_PID="$!"
  echo "hard_PMR pid=$PMR_PID log=$PMR_LOG"
fi

if [ "$RUN_PMR_ROLLBACK" -eq 1 ]; then
  USER_IP_POOL="$USER_IP_POOL" \
  USER_MODEL_NAME="$USER_MODEL_NAME" \
  USER_BASE_URL="$USER_BASE_URL" \
  AGENT_MODEL_NAME="$AGENT_MODEL_NAME" \
  AGENT_IP="$AGENT_IP" \
  AGENT_BASE_URL="$AGENT_BASE_URL" \
  OPEN_SOURCE="$OPEN_SOURCE" \
  REQUESTS_PER_IP="$REQUESTS_PER_IP" \
  AGENT_THINKING="$AGENT_THINKING" \
  AGENT_MAX_TOKENS="$AGENT_MAX_TOKENS" \
  TESTS="$TESTS_PMR_ROLLBACK" \
  nohup python3 -u "$SCRIPT_DIR/hard_PMR_rollback_no_issue.py" --task_id "$TASK_ID" >"$PMR_ROLLBACK_LOG" 2>&1 &
  PMR_ROLLBACK_PID="$!"
  echo "hard_PMR_rollback pid=$PMR_ROLLBACK_PID log=$PMR_ROLLBACK_LOG"
fi
