import re
import json
import time
import random
import openai
from openai import OpenAI
from zai import ZhipuAiClient
from json import JSONDecodeError
from itertools import combinations
from typing import List, Dict, Any

from .cards import *
from .player import *


class LLMAgentManager:
    model_id2name = {
        'deepseek-r1':"deepseek-reasoner",
        'seed-1.6t': 'doubao-seed-1-6-thinking-250715',
        "glm-4.5": "glm-4.5",
        }

    def __init__(self, file_path=None, if_local=False, api_name=None, model=None, tokenizer=None):
        self.if_local = if_local
        self.api_name = api_name
        self.file_path = file_path
        if self.if_local:
            self.model = model
            self.tokenizer = tokenizer
        else:
            self.client = openai.Client(api_key, base_url)
        self.max_retries = 10
        self.retry_delay = 5  # 重试延迟（秒）
        self.must_play = False
        with open("./system_prompt.txt", 'r', encoding='utf-8') as f:
            self.system_prompt = f.read()


    def write_jsonl_line(self, data):
        """写入一行 JSON 到文件"""
        if not self.file_path:
            return
        with open(self.file_path, "a", encoding="utf-8") as f:
            f.write(json.dumps(data, ensure_ascii=False) + "\n")

    def _generate(
        self,
        content,
        previous, 
        model_id
        ):
        if content != '':
            messages = previous+[{"role": "user", "content": content}]
        else:
            messages = previous
        # api or local
        if self.if_local:
            text = self.tokenizer.apply_chat_template(
                messages,
                tokenize=False,
                add_generation_prompt=True
            )
            model_inputs = self.tokenizer([text], return_tensors="pt").to(self.model.device)
            generated_ids = self.model.generate(model_inputs.input_ids, max_new_tokens=4096)
            response = self.tokenizer.decode(generated_ids[0][list(generated_ids[0]).index(151668)+1:]
            return response
        else:
            response = self.client.chat.completions.create(
                model = model_name,
                messages = messages,
            )
            organized_data = {
                'input': messages,
                'reasoning_content': getattr(response.choices[0].message, 'reasoning_content', None),
                'content': response.choices[0].message.content,
                'model': model_name,
                'usage': [response.usage.prompt_tokens, response.usage.completion_tokens],
            }
            self.write_jsonl_line(organized_data)
            return response.choices[0].message.content


    # 动作空间
    def all_playable_cards(self, player_cards, last_hand):
        if last_hand is None:
            for cards_len in [10, 9, 8, 7, 6, 5, 4, 3, 2, 1]:
                for comb in combinations(player_cards, cards_len):
                    h = Hand(comb)
                    if h.is_valid():
                        return h
            return []

        if not last_hand.is_valid():
            return []
        
        last_type = last_hand.type
        last_len = len(last_hand.cards)
    
        playable = []
        unique_playable = []
        # R&B
        if PokerCard('Joker', 'small') in player_cards and PokerCard('Joker', 'big') in player_cards and last_type != '王炸':
            playable.append(Hand([PokerCard('Joker', 'small'), PokerCard('Joker', 'big')]))
            unique_playable.append(Hand([PokerCard('Joker', 'small'), PokerCard('Joker', 'big')]))
        if last_type != '炸弹' and last_type != '王炸':
            rank_count = {}
            for card in player_cards:
                rank_count[card.rank] = rank_count.get(card.rank, 0) + 1
            bomb_rank = []
            for k,v in rank_count.items():
                if v >= 4:
                    bomb_rank.append(k)
            for i in range(len(bomb_rank)):
                bomb_rank[i] = [x for x in player_cards if x.rank == bomb_rank[i]]
                comb = combinations(bomb_rank[i], 4)
                playable.extend([Hand(x) for x in list(comb)])
                unique_playable.extend([Hand(x) for x in list(set(comb))])
        # 同长度
        for comb in combinations(player_cards, last_len):
            h = Hand(comb)
            if not h.is_valid():
                continue
    
            if h > last_hand:
                if h.type == last_type and len(h.cards) == last_len:
                    playable.append(h)
    
        playable.sort()
        unique_playable_rank = []
        for i in range(len(playable)):
            if (c:=[x.rank for x in playable[i]]) not in unique_playable_rank:
                unique_playable.append(playable[i])
                unique_playable_rank.append(c)
        unique_playable.sort()
        return playable, unique_playable

    def generate_prompt(self, player: 'Player', action_type: str, game_state: Dict) -> str:
        """
        生成LLM提示
        
        :param player: 玩家对象
        :param action_type: 行动类型 ('call', 'double', 'play')
        :param game_state: 游戏状态字典
        :return: 提示字符串
        """
        prompt = f"你正在玩斗地主游戏，你是玩家：{player.name}"
        
        # 添加角色信息
        if action_type == "call": 
            prompt += "\n你的角色未定"
        else:
            if player.is_landlord:
                prompt += "\n你的角色是: 地主"
            else:
                prompt += f"\n你的角色是: {player.type}"
        # 添加游戏历史信息
        if game_state.get('history'):
            prompt += f"\n\n以下是游戏的对局信息: "
            for i, action in enumerate(game_state['history'],1):
                    prompt += f"\n{i}. {action}"
        # 添加手牌信息
        prompt += f"\n\n你的手牌是: {', '.join(card.str_zh() for card in sorted(player.hand))}"
        # ===========================================================================================================
        # 根据行动类型添加特定提示
        if action_type == "call":
            prompt += "\n\n现在是叫分阶段。你可以选择叫1分、2分、3分或者不叫(0分)。"
            prompt += '\n请使用json格式回复: {"CALL": <分数>}'
            prompt += '\n例如: {"CALL": 2} 表示叫2分'
            prompt += "\n注意: 分数必须是0-3的整数"
        
        elif action_type == "double": # 1. 农民加倍互相不知道 2. 首次加倍没有地主，地主只有再加倍
            prompt += "\n\n现在是加倍阶段。"
            if player.is_landlord: # 地主 （此时有农民加倍）
                if player.next_player.doubled:
                    if player.pre_player.doubled:
                        prompt += "\n上家农民和下家农民都选择加倍。"
                    else:
                        prompt += "\n下家农民选择加倍。"
                else:
                    prompt += "\n上家农民选择加倍。"
            prompt += "现在请你选择加倍或者不加倍。"
            prompt += '\n请使用json格式回复: {"DOUBLE": "<是/否>"}'
            prompt += '\n例如: {"DOUBLE": "是"} 表示选择加倍'
            prompt += "\n注意: 只能回答'是'或'否'"

        elif action_type == 'public':
            # 只能为地主
            if player.is_landlord:
                prompt += "\n请地主选择是否明牌。"
                prompt += '\n请使用json格式回复: {"PUBLIC": "<是/否>"}'
                prompt += '\n例如: {"PUBLIC": "是"} 表示选择加倍'
                prompt += "\n注意: 只能回答'是'或'否'"
        
        elif action_type == "play":
            self.must_play = False
            if game_state.get('last_played_by'): # 非第一次出牌
                last_hand_played_by = game_state['last_played_by']
                # 添加 ta 人手牌信息
                prompt += f"\n{player.pre_player.type} {player.pre_player.name} 剩余{len(player.pre_player.hand)}张手牌；{player.next_player.type} {player.next_player.name} 剩余{len(player.next_player.hand)}张手牌。"

                if game_state['pass_count'] == 0:
                    prompt += f"\n上一手牌是由 {last_hand_played_by.type} {last_hand_played_by.name} 出的。你此次出牌后的下一出牌者是 {player.next_player.type} {player.next_player.name}。" 
                elif game_state['pass_count'] == 1: # 上一个人没要
                    prompt += f"\n上一手牌是由 {last_hand_played_by.type} {last_hand_played_by.name} 出的，{player.pre_player.type} {player.pre_player.name} 没要。你此次出牌后的下一出牌者仍然是 {player.next_player.type} {player.next_player.name} 。" 
                elif game_state['pass_count'] == 2: # 没人压牌
                    prompt += "\n你的上一次出牌没人要得起，现在你可以再次出牌，且必须出牌。" 
                    
                if game_state.get('last_hand'): # 此时 pass_count!=2
                    last_hand = game_state['last_hand']
                    prompt += f"\n上一手牌是: {last_hand.type} ({', '.join([card.str_zh() for card in last_hand.cards])})"
                    prompt += "\n你需要出比上一手牌大的牌型"
                    if game_state['pass_count'] != 2:
                        prompt += "，或者选择不出。"
                    action_space = self.all_playable_cards(player.hand, last_hand)
                    if len(action_space) == 2 and action_space[1]:
                        action_space_str = ',\n'.join([f"[{', '.join(card.str_zh() for card in h)}]" for h in action_space[1]])
                        prompt += f'\n你可用的手牌组合为：{action_space_str}等等。'
                    else:
                        prompt += f'\n你目前没有可出的手牌组合，请直接 PASS。'
                        prompt += '\n\n请使用json格式回复: {"PLAY": "PASS"}'
                        return prompt
                if game_state['pass_count'] != 2:
                    prompt += '\n\n请从可用的手牌组合中选取一组打出，并使用json格式回复: {"PLAY": ["牌1", "牌2", ...]} 或 {"PLAY": "PASS"}'
                    prompt += '\n例如: {"PLAY": ["黑桃3"]} 或者 {"PLAY": ["小王", "大王"]} 或者 {"PLAY": ["方块J", "梅花J"]}'
                    prompt += '\n例如: {"PLAY": "PASS"} 表示不出'
                else:
                    self.must_play = True
                    prompt += '\n\n请从可用的手牌组合中选取一组打出，使用json格式回复: {"PLAY": ["牌1", "牌2", ...]}'
                    prompt += '\n例如: {"PLAY": ["黑桃3"]} 或者 {"PLAY": ["小王", "大王"]} 或者 {"PLAY": ["方块J", "梅花J"]}'

            else: # 第一次出牌
                self.must_play = True
                prompt += "\n\n你是第一个出牌的玩家，第一次出牌不能PASS。现在请你出牌。"
                prompt += '\n\n请使用json格式回复: {"PLAY": ["牌1", "牌2", ...]}'
                prompt += '\n例如: {"PLAY": ["黑桃3"]} 或者 {"PLAY": ["小王", "大王"]} 或者 {"PLAY": ["方块J", "梅花J"]}'
            prompt += "\n注意: 牌名必须与手牌中的牌的名称一致。请你在认真思考后做出决策："

        elif action_type == "feedback":
            # 添加 ta 人手牌信息
            prompt += f"\n{player.pre_player.type} {player.pre_player.name} 剩余{len(player.pre_player.hand)}张手牌；{player.next_player.type} {player.next_player.name} 剩余{len(player.next_player.hand)}张手牌。"
            
            play_count = game_state['whole_play_count']
            if play_count == 0: # 第一个出牌
                pass
            elif play_count == 1: # 第二个出牌
                last_player, last_player_hand = game_state["last_player&hand"] 
                prompt += '\n请你根据以上对局信息，评估上家（前一位出牌者）的出牌（包括PASS）对你当前局势的影响：'
                last_type = '队友' if player.type[-2:]==last_player.type[-2:] else '对手'
                prompt += f"\n上一手牌是由{last_type} {last_player.type} {last_player.name} 打出的：{last_player_hand.type} ({', '.join([card.str_zh() for card in last_player_hand.cards])})"
                prompt += '\n评估规则：为每项出牌在 [-5, 5] 区间给出整数评分： 5分：极大帮助（如：完美配合你的牌型、压制对手、为你创造主动权） 0分：无显著影响（如：无关牌型、未改变局势） -5分：极大威胁（如：破坏你的出牌计划、逼迫你拆解关键牌、助长对手优势）'
                prompt += '\n请使用JSON格式回复：{"last_player_impact": 上家出牌评分（整数）, "last_player_reason": "评分理由（1-2句话）"}'
                
            else:
                last_player, last_player_hand = game_state["last_player&hand"]
                last_last_player, last_last_player_hand = game_state["last_last_player&hand"] 
                prompt += '\n请你根据以上对局信息，评估上家（前一位出牌者）和上上家（前第二位出牌者）的出牌（包括PASS）对你当前局势的影响：'
                last_type = '队友' if player.type[-2:]==last_player.type[-2:] else '对手'
                last_last_type = '队友' if player.type[-2:]==last_last_player.type[-2:] else '对手'
                if last_player_hand:
                    prompt += f"\n上一手牌是由你的{last_type} {last_player.type} {last_player.name} 打出的：{last_player_hand.type} ({', '.join([card.str_zh() for card in last_player_hand.cards])})"
                else:
                    prompt += f"\n上一次出牌中，你的{last_type} {last_player.type} {last_player.name} 选择了PASS"
                if last_last_player_hand:
                    prompt += f"\n上上手牌是由你的{last_last_type} {last_last_player.type} {last_last_player.name} 打出的：{last_last_player_hand.type} ({', '.join([card.str_zh() for card in last_last_player_hand.cards])})"
                else:
                    prompt += f"\n上上次出牌中，你的{last_last_type} {last_last_player.type} {last_last_player.name} 选择了PASS"
                    
                prompt += '\n评估规则：为每项出牌在 [-5, 5] 区间给出整数评分： 5分：极大帮助（如：完美配合你的牌型、压制对手、为你创造主动权） 0分：无显著影响（如：无关牌型、未改变局势） -5分：极大威胁（如：破坏你的出牌计划、逼迫你拆解关键牌、助长对手优势）'
                prompt += '\n请使用JSON格式回复：{"last_player_impact": 上家出牌评分（整数）, "last_player_reason": "评分理由（1-2句话）", "second_last_player_impact": 上上家出牌评分（整数）, "second_last_player_reason": "评分理由（1-2句话）"}'
            prompt += '\n请给出评估：'

        return prompt


    def generate_complete_info_prompt(self, player: 'Player', action_type: str, game_state: Dict) -> str:
        prompt = '\n系统直接告知你其他玩家的手牌：'
        if action_type == 'call':
            prompt += f"\n你的上家 {player.pre_player.name} 的手牌为：{', '.join(card.str_zh() for card in sorted(player.pre_player.hand))}"
            prompt += f"\n你的下家 {player.next_player.name} 的手牌为：{', '.join(card.str_zh() for card in sorted(player.next_player.hand))}"
        else:
            pre_type = '队友' if player.type[-2:]==player.pre_player.type[-2:] else '对手'
            last_type = '队友' if player.type[-2:]==player.next_player.type[-2:] else '对手'
            prompt += f"\n你的{pre_type} {player.pre_player.type} {player.pre_player.name} 的手牌为：{', '.join(card.str_zh() for card in sorted(player.pre_player.hand))}"
            prompt += f"\n你的{last_type} {player.next_player.type} {player.next_player.name} 的手牌为：{', '.join(card.str_zh() for card in sorted(player.next_player.hand))}"
        prompt += "\n现在，请你在具有完整信息的情况下重新给出决策："

        return prompt

    def extract_last_json_dict(self, text):
        pattern = r'\{[^{}]*\}'
        matches = re.findall(pattern, text)
        
        if not matches: return None
        candidate = matches[-1]
        try:
            return json.loads(candidate)
        except JSONDecodeError:
            try:
                fixed = candidate.replace('\'','\"')
                return json.loads(fixed)
            except JSONDecodeError:
                pass
        return None
    
    def parse_response(self, response: str, action_type: str, player: 'Player') -> Any:
        """
        解析LLM响应
        
        :param response: LLM响应文本
        :param action_type: 行动类型
        :param player: 玩家对象
        :return: 解析后的决策结果
        """
        response = response.strip().upper()
        
        try:
            if action_type == "call":
                decision_json = self.extract_last_json_dict(response)
                call_value = int(decision_json['CALL'])
                if call_value in [0, 1, 2, 3]:
                    return call_value
                else:
                    print(f'决策：CALL 不明->{call_value}')
                    return None
            
            elif action_type == "double":
                decision_json = self.extract_last_json_dict(response)
                if_double = decision_json['DOUBLE']
                if if_double == '是':
                    return True
                elif if_double == '否':
                    return False
                print(f'决策：DOUBLE 不明->{if_double}')
                return None

            elif action_type == 'public':
                decision_json = self.extract_last_json_dict(response)
                if_public = decision_json['PUBLIC']
                if if_public == '是':
                    return True
                elif if_public == '否':
                    return False
                print(f'决策：PUBLIC 不明->{if_public}')
                return None
            # 不出牌返回[]，否则返回Hand
            elif action_type == "play": # 返回Hand
                decision_json = self.extract_last_json_dict(response)
                card_str_list = decision_json['PLAY']
                if card_str_list == 'PASS':
                    return []
                try:
                    card_list = []
                    name_map_dict = PokerCard.SUIT_SYMBOLS_ZH_R
                    for card_str in card_str_list:
                        if '小王' in card_str:
                            card_list.append(PokerCard('Joker', 'small'))
                        elif '大王' in card_str:
                            card_list.append(PokerCard('Joker', 'big'))
                        else:
                            card_list.append(PokerCard(name_map_dict[card_str[:2]], card_str[2:].upper()))
                    if card_list:
                        return Hand(card_list)
                    else:
                        return []
                except:
                    print(f'决策：PLAY 不明->{card_str_list}')
                    return []
            elif action_type == "feedback":
                decision_json = self.extract_last_json_dict(response)
                return decision_json
        
        except Exception as e:
            print(f"解析响应时出错: {e}")
            return None

    
    def get_decision(self, player: 'Player', action_type: str, game_state: Dict) -> Any:
        """
        获取玩家决策
        
        :param player: 玩家对象
        :param action_type: 行动类型
        :param game_state: 游戏状态
        :messages: 对话全文
        :return: 决策结果
        """
        prompt = self.generate_prompt(player, action_type, game_state)
        if game_state['debugging']:
            print(f"\n[{player.name} 输入]: {prompt}")
        player.updata_messages("user", prompt)
        messages = [
            {"role": "system", "content": self.system_prompt},
            player.all_messages[-1]
        ]
        
        retry_count = 0
        while retry_count < self.max_retries:
            if len(messages)>2 and game_state['debugging']:
                print(messages[-1]['content'])
            try:
                # 调用 API
                response = self._generate('', messages, player.model_name)
                if game_state['debugging']:
                    print(f"[{player.name} 响应]: {response}")

                # 解析响应
                decision = self.parse_response(response, action_type, player)
                if game_state['debugging']:
                    print(f"[{player.name} 决策]: {decision}")
                if action_type == 'play' and self.must_play and not decision:
                    print(f"{player.name} 必须出牌但未出")
                    raise ValueError("必须出牌")
                    
                player.updata_messages("assistant", response)
                messages.append({"role": "assistant", "content": response})
                # 信息对称 complete information
                if game_state["complete_info_judge"] and action_type != "feedback":
                    complete_info_prompt = self.generate_complete_info_prompt(player, action_type, game_state)
                    complete_info_response = self._generate('', messages+[{"role": "user", "content": complete_info_prompt}], player.model_name)
                    if game_state['debugging']:
                        print(f"[{player.name} 完全信息响应]: {complete_info_response}")

                # 验证决策
                if decision is None:
                    raise ValueError("无法解析响应")
                
                # 对于出牌行动，验证牌是否有效
                if action_type == "play" and decision:
                    # 是否有效
                    if decision.type == Hand.INVALID:
                        new_prompt = '你所出牌的牌型无效，请重新出牌！'
                        messages.append({"role": "user", "content": new_prompt})
                        player.updata_messages("user", new_prompt) 
                        raise ValueError(f"出牌无效：{decision} ")
                    else:
                        if game_state['debugging']:
                            print('🎴牌型有效')
                    # 检查所有牌是否在玩家手牌中
                    for card in decision.cards:
                        if card not in player.hand:
                            new_prompt = f'你所出牌中，牌 {card} 不在手牌内，请重新出牌！'
                            messages.append({"role": "user", "content": new_prompt})
                            player.updata_messages("user", new_prompt) 
                            raise ValueError(f"牌 {card} 不在玩家手牌中")
                    # 检查出牌牌型是否与上家相同，检查出牌是否大于上家
                    if game_state.get('last_hand'):
                        if decision.type != game_state['last_hand'].type:
                            # 除了炸弹、王炸
                            if decision.type not in [Hand.ROCKET, Hand.BOMB]:
                                new_prompt = '你所出牌的牌型与上家不同，请重新出牌！'
                                messages.append({"role": "user", "content": new_prompt})
                                player.updata_messages("user", new_prompt) 
                                raise ValueError(f"牌 {decision} 牌型与上家不同")
                        elif decision > game_state['last_hand']:
                            if game_state['debugging']:
                                print('🎴牌型检查通过')
                        else:
                            new_prompt = '你所出牌未大于上家，请重新出牌！'
                            messages.append({"role": "user", "content": new_prompt})
                            player.updata_messages("user", new_prompt) 
                            raise ValueError(f"牌 {decision} 小于等于上家")
                    ## 必须出牌的情况
                    if not decision:
                        if game_state['pass_count'] == 2:
                            new_prompt = '你的上次出牌没人要，这次你必须出牌！'
                            messages.append({"role": "user", "content": new_prompt})
                            player.updata_messages("user", new_prompt) 
                            raise ValueError(f"{player.name} 必须出牌")
                        elif game_state['last_player_index'] == -1:
                            new_prompt = '开局第一手必须出牌，请重新抉择！'
                            messages.append({"role": "user", "content": new_prompt})
                            player.updata_messages("user", new_prompt) 
                            raise ValueError(f"{player.name} 开局没出牌")
                        else:
                            if game_state['debugging']:
                                print('🎴允许不出')
                
                return decision
            
            except Exception as e:
                player.error_num += 1
                print(f"决策出错 ({player.name}, 重试 {retry_count+1}/{self.max_retries}): {e}")
                retry_count += 1
                time.sleep(self.retry_delay)
        
        # 达到最大重试次数后使用默认决策
        print(f"达到最大重试次数，使用默认决策 ({player.name})")
        
        if action_type == "call":
            return 0
        elif action_type == "double":
            return False
        elif action_type == "public":
            return False
        elif action_type == "play":
            last_hand = game_state.get('last_hand')
            if game_state.get('last_hand'): # 此时 pass_count!=2
                action_space = self.all_playable_cards(player.hand, last_hand)
                if action_space[1]:
                    print(f"默认决策: ({action_space[1][0]})")
                    return action_space[1][0]
                else:
                    print("默认决策: ([])")
                    return []
            else:
                default_play = self.all_playable_cards(player.hand, None)
                print(f"默认决策: ({default_play})")
                return default_play
            

    def get_feedback(self, player: 'Player', action_type: str, game_state: Dict) -> Any:
        """获取玩家对前两个玩家的出牌反馈"""
        prompt = self.generate_prompt(player, action_type, game_state)
        if game_state['debugging']:
            print(f"\n[{player.name} 输入]: {prompt}")
        messages = [
            {"role": "system", "content": self.system_prompt},
            {"role": "user", "content": prompt}
        ]
        response = self._generate('', messages, player.model_name)
        feedback = self.parse_response(response, action_type, player)
        if game_state['debugging']:
            print(f"[{player.name} 反馈]: {feedback}")
        return feedback