import os
import asyncio
import json
import re
import requests
from typing import Dict, Literal, List, Callable
from pydantic import BaseModel, ValidationError
from autogen_agentchat.agents import AssistantAgent
from autogen_agentchat.messages import TextMessage
from autogen_core import CancellationToken
from autogen_ext.models.openai import OpenAIChatCompletionClient

# Load API keys
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
PAGODA_API_KEY = os.getenv("PAGODA_API_KEY")
if not OPENAI_API_KEY:
    raise ValueError("Missing OPENAI_API_KEY. Set it as an environment variable.")
if not PAGODA_API_KEY:
    raise ValueError("Missing PAGODA_API_KEY. Set it as an environment variable.")

class Move(BaseModel):
    move: Literal["O", "F"]
    prediction: Literal["O", "F"]
    reasoning: str

class Message(BaseModel):
    sender: Literal["M", "W"]
    message: str

class Player:
    def __init__(
        self,
        model: str,
        negotiation_role: str,
        game_role: str,
        version: str,
        temperature: float,
        total_messages: int,
        total_rounds: int = 10,
        max_retries: int = 10
    ):
        self.debug = False
        self.model = model
        self.negotiation_role = negotiation_role.lower()
        self.game_role = game_role.lower()
        self.version = version
        self.temperature = temperature
        self.total_messages = total_messages
        self.total_rounds = total_rounds
        self.max_retries = max_retries

        self.negotiation_history: List[Dict] = []
        self.game_history: List[Dict] = []
        self.total_payoff = 0
        self.prediction_score = 0

        if self.version == "classic":
            self.A, self.B, self.C = 3, 2, 0
        else:
            self.A, self.B, self.C = int('nan'), int('nan'), int('nan')

        self.base_url = (
            "https://api.openai.com/v1"
            if model.startswith("gpt") or "o3" in self.model
            else "https://ollama-ui.pagoda.liris.cnrs.fr/ollama/api/generate"
            if ":" in model
            else "http://localhost:11434/v1"
        )

        self.model_gamer_client = OpenAIChatCompletionClient(
            timeout=60,
            model=self.model,
            base_url=self.base_url,
            api_key=OPENAI_API_KEY,
            model_info={
                "temperature": self.temperature,
                "function_calling": True,
                "parallel_tool_calls": True,
                "family": "unknown",
                "json_output": True,
                "vision": False
            },
            response_format=Move
        )

        self.model_negotiator_client = OpenAIChatCompletionClient(
            timeout=60,
            model=self.model,
            base_url=self.base_url,
            api_key=OPENAI_API_KEY,
            model_info={
                "temperature": self.temperature,
                "function_calling": True,
                "parallel_tool_calls": True,
                "family": "unknown",
                "json_output": True,
                "vision": False
            },
            response_format=Message
        )



    def debug_print(self, msg: str):
        if self.debug:
            print(f"[DEBUG] {msg}")

    def generate_game_instruction(self, negotiation_summary: str, history_summary: str, round_id: int) -> str:
        base = f"""
You are playing a coordination game

Game Description:
Two people is deciding how to spend the evening. W prefers O, while M prefers F.
Both would rather go to the same event together than go alone, but each has a different preferred activity.

Payoff Rules:
- If both choose O: W receives {self.A} points, and M receives {self.B} points.
- If both choose F: W receives {self.B} points, and M receives {self.A} points.
- If they choose different activities (one chooses O and the other chooses F): both receive {self.C} points.

Your Role: {self.game_role.capitalize()}

Negotiation History:
{negotiation_summary}

Game History:
{history_summary}

This is round {round_id} of {self.total_rounds} in the game.

Your Goal: Maximize your own score by anticipating the opponent's move and by seeking coordination when it can lead to mutually beneficial outcomes.

Respond ONLY in the following JSON format:
{{
  "move": "O" | "F",
  "prediction": "O" | "F",
  "reasoning": "Explain how you predicted the opponent's move and how you chose your response"
}}
"""
        return base


    def generate_negotiation_instruction(self, negotiation_summary: str, round_id: int) -> str:
            base = f"""
You are playing a coordination game that involves a distributional conflict.

Game Description:
Two people is deciding how to spend the evening. W prefers O, while M prefers F.
Both would rather go to the same event together than go alone, but each has a different preferred activity.

Payoff Rules:
- If both choose O: W receives {self.A} points, and M receives {self.B} points.
- If both choose F: W receives {self.B} points, and M receives {self.A} points.
- If they choose different activities (one chooses O and the other chooses F): both receive {self.C} points.

Your Role: {self.game_role.capitalize()}

Your Goal: Maximize your own score by anticipating the opponent's move and by seeking coordination when it can lead to mutually beneficial outcomes.

You can discuss and negotiate with the other player to maximize the reward you can obtain before playing {self.total_rounds} rounds of the game. 

This is your turn to send message #{round_id} out of {self.total_messages} total allowed messages in the negotiation phase.

Negotiation History:
{negotiation_summary}

Respond ONLY in the following JSON format:
{{
    "sender": "{self.game_role}",
    "message": "Explain how you can coordinate to reach mutually beneficial outcomes."
}}
"""
            return base


    async def play_round(self) -> (str, str, str):
        round_id = len(self.game_history) + 1
        negotiation_summary = self.get_negotiation_summary()
        history_summary = self.get_history_summary()
        instruction = self.generate_game_instruction(negotiation_summary, history_summary, round_id)
        self.debug_print(f"\n=== GAME ROUND {round_id} ({self.game_role.upper()}) ===")
        #self.debug_print("Instruction sent to model:")
        #self.debug_print(instruction)
        if ":" in self.model:
            return await self.run_pagoda_for_playing(instruction)
        for attempt in range(1, self.max_retries + 1):
            try:
                agent = AssistantAgent(
                    name="Player",
                    model_client=self.model_gamer_client,
                    system_message="You are a helpful assistant."
                )
                response = await agent.on_messages(
                    [TextMessage(content=instruction, source="user")],
                    cancellation_token=CancellationToken()
                )
                content = response.chat_message.content
                #self.debug_print(f"Raw model output:\n{content}")
                agent_response = Move.model_validate_json(content)
                self.debug_print(f"Game Round {round_id} {self.game_role}  plays {agent_response.move}, predicts {agent_response.prediction},  since {agent_response.reasoning}")
                return agent_response.move, agent_response.prediction, agent_response.reasoning
            except (ValidationError, json.JSONDecodeError) as e:
                self.debug_print(f"Attempt {attempt}: Failed to parse response - {e}")
        raise ValueError("Model failed to provide a valid response after multiple attempts.")


    async def negotiate(self) -> (str, str):
        round_id = len(self.negotiation_history) + 1
        negotiation_summary = self.get_negotiation_summary()
        instruction = self.generate_negotiation_instruction(negotiation_summary, round_id)
        self.debug_print(f"\n=== NEGOTIATION ROUND {round_id} ({self.game_role.upper()}) ===")
        self.debug_print("Instruction sent to model:")
        self.debug_print(instruction)
        if ":" in self.model:
            return await self.run_pagoda_for_negotiating(instruction)
        for attempt in range(1, self.max_retries + 1):
            try:
                agent = AssistantAgent(
                    name="Player",
                    model_client=self.model_negotiator_client,
                    system_message="You are a helpful assistant."
                )
                response = await agent.on_messages(
                    [TextMessage(content=instruction, source="user")],
                    cancellation_token=CancellationToken()
                )
                content = response.chat_message.content
                self.debug_print(f"Raw model output:\n{content}")
                agent_response = Message.model_validate_json(content)
                self.debug_print(f"Negotiation Round {round_id} {agent_response.sender}  sends messages {agent_response.message}")
                return agent_response.sender, agent_response.message
            except (ValidationError, json.JSONDecodeError) as e:
                self.debug_print(f"Attempt {attempt}: Failed to parse response - {e}")
        raise ValueError("Model failed to provide a valid response after multiple attempts.")


    async def run_pagoda_for_playing(self, instruction: str) -> (str, str, str):
        headers = {
            "Authorization": f"Bearer {PAGODA_API_KEY}",
            "Content-Type": "application/json"
        }
        payload = {
            "model": self.model,
            "temperature": self.temperature,
            "prompt": instruction,
            "stream": False
        }
        for attempt in range(1, self.max_retries + 1):
            try:
                response = requests.post(self.base_url, headers=headers, json=payload)
                response.raise_for_status()
                raw_response = response.json().get("response", "")
                parsed_json = self.extract_json_from_response(raw_response)
                if parsed_json:
                    agent_response = Move(**parsed_json)
                    return agent_response.move, agent_response.prediction, agent_response.reasoning
                #self.debug_print(f"Attempt {attempt}: Could not parse JSON from: {raw_response}")
            except Exception as e:
                self.debug_print(f"Attempt {attempt}: Pagoda error - {e}")
        raise ValueError("Pagoda API failed after multiple attempts.")

    async def run_pagoda_for_negotiating(self, instruction: str) -> (str, str, str):
        headers = {
            "Authorization": f"Bearer {PAGODA_API_KEY}",
            "Content-Type": "application/json"
        }
        payload = {
            "model": self.model,
            "temperature": self.temperature,
            "prompt": instruction,
            "stream": False
        }

        for attempt in range(1, self.max_retries + 1):
            try:
                response = requests.post(self.base_url, headers=headers, json=payload)
                response.raise_for_status()
                raw_response = response.json().get("response", "")
                parsed_json = self.extract_json_from_response(raw_response)
                if parsed_json:
                    agent_response = Message(**parsed_json)
                    return agent_response.sender, agent_response.message
                #self.debug_print(f"Attempt {attempt}: Could not parse JSON from: {raw_response}")
            except Exception as e:
                self.debug_print(f"Attempt {attempt}: Pagoda error - {e}")
        raise ValueError("Pagoda API failed after multiple attempts.")


    def extract_json_from_response(self, text: str) -> dict:
        try:
            match = re.search(r"\{.*\}", text, re.DOTALL)
            if match:
                return json.loads(match.group())
        except Exception as e:
            self.debug_print(f"JSON extract error: {e}")
        return {}


    def determine_outcome(self, player_move: str, opponent_move: str) -> int:
        # If both players made the same move
        if player_move == opponent_move:
            # The player gets A if it's their preferred option
            if (player_move == "F" and self.game_role == "m") or (player_move == "O" and self.game_role == "w"):
                return self.A
            else:
                return self.B
        # If the players made different moves (coordination failed)
        return self.C


    def update_score(self, outcome: int):
        self.total_payoff += outcome

    def get_history_summary(self) -> str:
        if not self.game_history:
            return "No previous game rounds."
        lines = [
            f"Round {i + 1}: You chose {r['Agent Move']}, Opponent chose {r['Opponent Move']}. Score: {r['Outcome']}"
            for i, r in enumerate(self.game_history)
        ]
        return "\n".join(lines) + f"\nTotal Playing Score: {self.total_payoff}\nCorrect Predictions: {self.prediction_score}/{len(self.game_history)}"

    def get_negotiation_summary(self) -> str:
        if not self.negotiation_history:
            return "No previous negotiation rounds."
        lines = [
            f"Round {i + 1}: {r['Sender']} send message: {r['Message']}."
            for i, r in enumerate(self.negotiation_history)
        ]
        return "\n".join(lines)

role_prompt = """You are {role} in a coordination game with your partner. You need to choose between going to F or O..."""
# où {role} sera 'M' ou 'W'


# Runner
async def main():
    total_rounds = 10
    man = Player(
        model="qwen3",
        negotiation_role="initiator",
        game_role="man",
        version="classic",
        temperature=0.7,
        total_messages=0,
        total_rounds=total_rounds
    )
    woman = Player(
        model="qwen3",
        negotiation_role="responder",
        game_role="woman",
        version="classic",
        temperature=0.7,
        total_messages=0,
        total_rounds=total_rounds
    )

    for round_id in range(1, total_rounds + 1):
        (man_move, man_prediction, man_reasoning), (woman_move, woman_prediction, woman_reasoning) = await asyncio.gather(
            man.play_round(),
            woman.play_round()
        )

        man_score = man.determine_outcome(man_move, woman_move)
        woman_score = woman.determine_outcome(woman_move, man_move)

        man.update_score(man_score)
        woman.update_score(woman_score)

        if man_prediction == woman_move:
            man.prediction_score += 1
        if woman_prediction == man_move:
            woman.prediction_score += 1

        man.game_history.append({
            "Round": round_id,
            "Agent Move": man_move,
            "Opponent Move": woman_move,
            "Outcome": man_score
        })
        woman.game_history.append({
            "Round": round_id,
            "Agent Move": woman_move,
            "Opponent Move": man_move,
            "Outcome": woman_score
        })


        print(f"\n🔄 Round {round_id} Results:")
        print(f"👨 Man: Move={man_move}, Prediction={man_prediction}, Score={man_score}")
        print(f"   Reasoning: {man_reasoning}")
        print(f"👩 Woman: Move={woman_move}, Prediction={woman_prediction}, Score={woman_score}")
        print(f"   Reasoning: {woman_reasoning}")

        print(f"✅ Prediction Accuracy So Far:")
        print(f"   Man: {man.prediction_score}/{round_id} ({man.prediction_score / round_id * 100:.1f}%)")
        print(f"   Woman: {woman.prediction_score}/{round_id} ({woman.prediction_score / round_id * 100:.1f}%)")
        print(f"🎯 Total Scores: Man={man.total_payoff}, Woman={woman.total_payoff}")

    print(f"\n🏁 Final Results")
    print(f"Total Score: Man = {man.total_payoff}, Woman = {woman.total_payoff}")
    print(f"Prediction Accuracy:")
    print(f"  Man = {man.prediction_score}/{total_rounds} ({man.prediction_score / total_rounds * 100:.1f}%)")
    print(f"  Woman = {woman.prediction_score}/{total_rounds} ({woman.prediction_score / total_rounds * 100:.1f}%)")

if __name__ == "__main__":
    asyncio.run(main())