{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "80687efa-684d-44b9-9551-718a63ad9c9d",
   "metadata": {},
   "source": [
    "### 全面复式循环赛"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "fd69903b-2068-4c93-9895-9e18e51171ed",
   "metadata": {},
   "source": [
    "#### API"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "eb897e1f-d817-4111-815f-0cdd92e0436b",
   "metadata": {},
   "outputs": [],
   "source": [
    "import time\n",
    "import queue\n",
    "from datetime import datetime\n",
    "from DouDiZhu.cards import PokerCard\n",
    "from DouDiZhu.game_logic import DouDiZhuGame\n",
    "from DouDiZhu.llmagent import LLMAgentManager\n",
    "\n",
    "print(\"=== 斗地主游戏开始 ===\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "3e0a420a-a6bf-4868-bec0-6a27d0beb55b",
   "metadata": {},
   "outputs": [],
   "source": [
    "import uuid\n",
    "import random\n",
    "import itertools\n",
    "import threading\n",
    "from pprint import pprint\n",
    "import concurrent.futures\n",
    "\n",
    "\n",
    "def generate_fixed_cards():\n",
    "    deck = PokerCard.create_deck()\n",
    "    random.shuffle(deck)\n",
    "    players_hand = [[] for _ in range(3)]\n",
    "    for i in range(51):\n",
    "        players_hand[i % 3].append(deck.pop())\n",
    "    bottom_cards = deck[:3]\n",
    "    players_hand.append(bottom_cards)\n",
    "    \n",
    "    return players_hand\n",
    "\n",
    "def run_game(team_models, fixed_card):\n",
    "    \"\"\"运行单个游戏\"\"\"\n",
    "    game = DouDiZhuGame(\n",
    "        player_configs = {\n",
    "            \"Player1\": {'type': 'llm', 'model': team_models[0], \n",
    "                        'if_local': False, 'model_class': None, 'tokenizer': None},\n",
    "            \"Player2\": {'type': 'llm', 'model': team_models[1], \n",
    "                        'if_local': False, 'model_class': None, 'tokenizer': None},\n",
    "            \"Player3\": {'type': 'llm', 'model': team_models[2], \n",
    "                        'if_local': False, 'model_class': None, 'tokenizer': None}\n",
    "        },\n",
    "        update_queue = queue.Queue(),\n",
    "        save_folder_path = f'./data_save_{uuid.uuid4().hex}',\n",
    "        fixed_card=fixed_card,\n",
    "        )\n",
    "    game.play_game()\n",
    "    print([f'{player.model_name}:{player.score}' for player in game.players])\n",
    "    return game\n",
    "    "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2cbd2d0a-5f10-4af7-bd2d-f13023ea384a",
   "metadata": {},
   "outputs": [],
   "source": [
    "score_lock = threading.Lock()\n",
    "\n",
    "def run_single_matchup(matchup_data, shared_score_dict, shared_error_num_dict):\n",
    "    \"\"\"\n",
    "    执行单轮对抗的任务函数。此函数将在独立的线程中运行。\n",
    "    \n",
    "    Args:\n",
    "        matchup_data (tuple): 包含 (轮次索引, (队伍1, 队伍2)) 的元组。\n",
    "        shared_score_dict (dict): 对全局 score 字典的引用。\n",
    "    \"\"\"\n",
    "    i, (team1_models, team2_models) = matchup_data\n",
    "    time.sleep(i+2)\n",
    "    \n",
    "    print(f\"--- [任务开始] 第 {i+1} 轮: {', '.join(team1_models)} vs {', '.join(team2_models)} ---\")\n",
    "    print(f\"当前时间 {datetime.now().strftime('%Y-%m-%d-%H:%M:%S')}\")\n",
    "    \n",
    "    players_hand = generate_fixed_cards()\n",
    "\n",
    "    with concurrent.futures.ThreadPoolExecutor(max_workers=2) as executor:\n",
    "        future1 = executor.submit(run_game, team1_models, players_hand)\n",
    "        time.sleep(1)\n",
    "        future2 = executor.submit(run_game, team2_models, players_hand)\n",
    "        game1 = future1.result()\n",
    "        game2 = future2.result()\n",
    "\n",
    "    local_score_updates = []\n",
    "    for player1, player2 in zip(game1.players, game2.players):\n",
    "        score_dist = player1.score - player2.score\n",
    "        local_score_updates.append((player1.model_name, score_dist))\n",
    "        local_score_updates.append((player2.model_name, -score_dist))\n",
    "    print('本轮得分：', local_score_updates)\n",
    "    \n",
    "    local_error_num_updates = dict()\n",
    "    for player1, player2 in zip(game1.players, game2.players):\n",
    "        local_error_num_updates[player1.model_name] = player1.error_num\n",
    "        local_error_num_updates[player2.model_name] = player2.error_num\n",
    "    print('本轮出错：', local_error_num_updates)\n",
    "    # 锁\n",
    "    with score_lock:\n",
    "        print(f\"--- [正在更新分数] 第 {i+1} 轮 ---\")\n",
    "        for model_name, delta in local_score_updates:\n",
    "            shared_score_dict[model_name] += delta\n",
    "        print('更新得分：', shared_score_dict)\n",
    "        for k,v in local_error_num_updates.items():\n",
    "            shared_error_num_dict[k] += v\n",
    "        print('更新出错：', local_error_num_updates)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "943149e9-688e-41b2-89ef-41e73ea05ed7",
   "metadata": {},
   "outputs": [],
   "source": [
    "all_res = []\n",
    "for _ in range(20):\n",
    "    \"\"\"6个模型全面循环复式赛制。\"\"\"\n",
    "    models = [\"gpt-5\", \"gemini-2.5-pro\", \"o4-mini\",\n",
    "              \"deepseek-reasoner\", \"glm-4.5\", \"doubao-seed-1-6-thinking-250715\"]\n",
    "    \n",
    "    score = {model: 0 for model in models}\n",
    "    error_num = {model: 0 for model in models}\n",
    "    \n",
    "    all_combinations = list(itertools.combinations(models, 3))\n",
    "    \n",
    "    matchups = []\n",
    "    seen_teams = set()\n",
    "    for team1_tuple in all_combinations:\n",
    "        team1 = set(team1_tuple)\n",
    "        if frozenset(team1) not in seen_teams:\n",
    "            team2 = set(models) - team1\n",
    "            seen_teams.add(frozenset(team1))\n",
    "            seen_teams.add(frozenset(team2))\n",
    "            matchups.append((sorted(list(team1)), sorted(list(team2))))\n",
    "    \n",
    "    print(f\"比赛开始！共 {len(matchups)} 轮对抗。\\n\")\n",
    "    \n",
    "    with concurrent.futures.ThreadPoolExecutor(max_workers=1) as executor:\n",
    "        tasks_to_submit = [(i, matchup_data) for i, matchup_data in enumerate(matchups)]\n",
    "        future_tasks = [executor.submit(run_single_matchup, task_data, score, error_num) for task_data in tasks_to_submit]\n",
    "        concurrent.futures.wait(future_tasks)\n",
    "    \n",
    "    print(\"================ 比赛结束 ================\")\n",
    "    print(f\"结束时间 {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}\")\n",
    "    print(\"最终总分:\")\n",
    "    pprint(score)\n",
    "    pprint(error_num)\n",
    "    \n",
    "    final_ranking = sorted(score.items(), key=lambda item: item[1], reverse=True)\n",
    "    print(\"\\n最终排名:\")\n",
    "    for rank, (model, final_score) in enumerate(final_ranking, 1):\n",
    "        all_res.append(text_res:=f\"  第 {rank} 名: 模型 {model}, 总分: {final_score}, 出错: {error_num[model]}\")\n",
    "        print(text_res)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "092415dd-7d13-443a-aeab-ddc17cd0bd15",
   "metadata": {},
   "outputs": [],
   "source": [
    "import re\n",
    "import pprint\n",
    "from collections import defaultdict\n",
    "\n",
    "def parse_model_results(text_data: str) -> dict:\n",
    "    cal_num = 0\n",
    "    model_stats = defaultdict(lambda: {\"总分\": 0, \"出错\": 0})\n",
    "    pattern = re.compile(r\"模型\\s+(.*?),\\s+总分:\\s+(-?\\d+),\\s+出错:\\s+(\\d+)\")\n",
    "    \n",
    "    for line in text_data.splitlines():\n",
    "        match = pattern.search(line)\n",
    "        \n",
    "        if match:\n",
    "            cal_num += 1\n",
    "            model_name = match.group(1).strip()\n",
    "            score = int(match.group(2))\n",
    "            errors = int(match.group(3))\n",
    "            \n",
    "            model_stats[model_name][\"总分\"] += score\n",
    "            model_stats[model_name][\"出错\"] += errors\n",
    "    print(cal_num)\n",
    "    return dict(model_stats)\n",
    "\n",
    "text_data = '\\n'.join(all_res)\n",
    "final_results = parse_model_results(text_data)\n",
    "all_final_ranking = sorted(final_results.items(), key=lambda item: item[1]['总分'], reverse=True)\n",
    "all_final_ranking"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.11"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
