import os
import asyncio
import json
import re
import requests
import json
import ast
from typing import Dict, Literal, List, Callable
from pydantic import BaseModel, ValidationError
from autogen_agentchat.agents import AssistantAgent
from autogen_agentchat.messages import TextMessage
from autogen_core import CancellationToken
from autogen_ext.models.openai import OpenAIChatCompletionClient
# Load API keys
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
PAGODA_API_KEY = os.getenv("PAGODA_API_KEY")

# Define constants for moves and roles to avoid hardcoding strings.
OPERA = "O"
FOOTBALL = "F"
MAN = "M"
WOMAN = "W"


def debug_print(msg: str):
    try:
        json_str_match = re.search(r'\{.*\}', msg, re.DOTALL)
        if json_str_match:
            json_str = json_str_match.group(0)
            data = ast.literal_eval(json_str)
            prefix = msg[:msg.find(json_str)]
            print(f"[DEBUG] {prefix}\n{json.dumps(data, indent=4)}")
        else:
            print(f"[DEBUG] {msg}")
    except (ValueError, SyntaxError):
        print(f"[DEBUG] {msg}")

# Response format
class AgentResponse(BaseModel):
    move: Literal[OPERA, FOOTBALL]
    prediction: Literal[OPERA, FOOTBALL, "None"]
    reasoning: str


class BoS:
    def __init__(
        self,
        model: str,
        role: str,
        prediction: bool,
        version: str,
        temperature: float,
        game_id: int,
        opponent_strategy_fn: Callable[[List[Dict]], str],
        strategy: bool = False,
        total_rounds: int = 10,
        max_retries: int = 10
    ):
        self.debug = True
        self.model = model
        self.role = role.lower()
        self.prediction = prediction
        self.version = version
        self.temperature = temperature
        self.game_id = game_id
        self.strategy = strategy
        self.total_rounds = total_rounds
        self.max_retries = max_retries
        self.history: List[Dict] = []
        self.player_score_game = 0
        self.prediction_score = 0
        self.opponent_strategy_fn = opponent_strategy_fn

        # Class attributes for moves and roles
        self.OPERA_MOVE = OPERA
        self.FOOTBALL_MOVE = FOOTBALL
        self.MAN_ROLE = MAN
        self.WOMAN_ROLE = WOMAN

        # Payoff matrix
        if self.version == "classic":
            self.A, self.B, self.C = 3, 2, 0
        else:
            self.A, self.B, self.C = float('nan'), float('nan'), float('nan')

        self.base_url = (
            "https://api.openai.com/v1"
            if model.startswith("gpt")
            else "https://ollama-ui.pagoda.liris.cnrs.fr/ollama/api/generate"
            if ":" in model
            else "http://localhost:11434/v1"
        )

        self.model_client = OpenAIChatCompletionClient(
            timeout=60,
            model=self.model,
            base_url=self.base_url,
            api_key=OPENAI_API_KEY,
            model_info={
                "temperature": self.temperature,
                "function_calling": True,
                "parallel_tool_calls": True,
                "family": "unknown",
                "json_output": True,
                "vision": False
            },
            response_format=AgentResponse
        )

    async def play_round(self, round_id: int) -> Dict:
        opponent_move = self.opponent_strategy_fn(self.history)

        if self.strategy:
            move, prediction, reasoning, instruction = self.apply_strategy(opponent_move)
        else:
            move, prediction, reasoning, instruction = await self.model_based_decision()

        outcome = self.determine_outcome(move, opponent_move)
        self.update_score(outcome)

        prediction_current_score = 0.0
        if self.prediction and prediction in [self.OPERA_MOVE, self.FOOTBALL_MOVE]:
            if prediction == opponent_move:
                prediction_current_score = 1.0
                self.prediction_score += 1

        round_result = {
            "Agent Move": move,
            "Prediction": prediction,
            "Opponent Move": opponent_move,
            "Reasoning": reasoning,
            "Outcome": outcome,
            "Current Player Prediction Score Game": self.prediction_score,
            "PredictionOutcome": prediction_current_score
        }

        self.history.append(round_result)
        debug_print(f"Round {round_id}: {instruction}")
        debug_print(f"Round {round_id}: {round_result}")
        return round_result

    def generate_instruction(self, history_summary: str, round_id: int) -> str:
        base = f"""
You are playing a coordination game.

Game Description:
A couple is deciding how to spend the evening. Player {self.WOMAN_ROLE.capitalize()} prefers {self.OPERA_MOVE}, while Player {self.MAN_ROLE.capitalize()} prefers {self.FOOTBALL_MOVE}.
Both would rather go to the same event together than go alone, but each has a different preferred activity.

Payoffs:
- {self.OPERA_MOVE}/{self.OPERA_MOVE}: {self.WOMAN_ROLE.capitalize()} gets {self.A}, {self.MAN_ROLE.capitalize()} gets {self.B}
- {self.FOOTBALL_MOVE}/{self.FOOTBALL_MOVE}: {self.WOMAN_ROLE.capitalize()} gets {self.B}, {self.MAN_ROLE.capitalize()} gets {self.A}
- Mismatch: Both get {self.C}

Your Role: {self.role.capitalize()}
This is round {round_id} of {self.total_rounds}.
Game History:
{history_summary}
"""
        if not self.prediction:
            return base + f"""
Your Goal: Maximize your own score by anticipating the opponent’s move — whether it is random, pattern-based, or strategic — and by seeking coordination when it can lead to mutually beneficial outcomes.

Respond ONLY in the following JSON format:
{{
  "move": "{self.OPERA_MOVE}" | "{self.FOOTBALL_MOVE}",
  "prediction": "None",
  "reasoning": "Explain your decision based on your preferences and the past moves"
}}
"""
        return base + f"""
Your Goal: Maximize your own score by anticipating the opponent’s move — whether it is random, pattern-based, or strategic — and by seeking coordination when it can lead to mutually beneficial outcomes.

Respond ONLY in the following JSON format:
{{
  "move": "{self.OPERA_MOVE}" | "{self.FOOTBALL_MOVE}",
  "prediction": "{self.OPERA_MOVE}" | "{self.FOOTBALL_MOVE}",
  "reasoning": "Explain how you predicted the opponent's move and how you chose your response"
}}
"""

    async def model_based_decision(self) -> (str, str, str, str):
        history_summary = self.get_history_summary()
        instruction = self.generate_instruction(history_summary, len(self.history) + 1)

        if ":" in self.model:
            return await self.run_pagoda(instruction)

        for attempt in range(1, self.max_retries + 1):
            try:
                agent = AssistantAgent(
                    name="Player",
                    model_client=self.model_client,
                    system_message="You are a helpful assistant."
                )
                response = await agent.on_messages(
                    [TextMessage(content=instruction, source="user")],
                    cancellation_token=CancellationToken()
                )
                content = response.chat_message.content
                agent_response = AgentResponse.model_validate_json(content)
                return agent_response.move, agent_response.prediction, agent_response.reasoning, instruction
            except (ValidationError, json.JSONDecodeError) as e:
                debug_print(f"Attempt {attempt}: Parse error - {e}")

        raise ValueError("Model failed to provide a valid response after multiple attempts.")

    async def run_pagoda(self, instruction: str) -> (str, str, str, str):
        headers = {
            "Authorization": f"Bearer {PAGODA_API_KEY}",
            "Content-Type": "application/json"
        }
        payload = {
            "model": self.model,
            "temperature": self.temperature,
            "prompt": instruction,
            "stream": False
        }

        for attempt in range(1, self.max_retries + 1):
            try:
                response = requests.post(self.base_url, headers=headers, json=payload)
                response.raise_for_status()
                raw_response = response.json().get("response", "")
                parsed_json = self.extract_json_from_response(raw_response)
                if parsed_json:
                    agent_response = AgentResponse(**parsed_json)
                    return agent_response.move, agent_response.prediction, agent_response.reasoning, instruction
                debug_print(f"Attempt {attempt}: Could not parse JSON from: {raw_response}")
            except Exception as e:
                debug_print(f"Attempt {attempt}: Pagoda error - {e}")

        raise ValueError("Pagoda API failed after multiple attempts.")

    def extract_json_from_response(self, text: str) -> dict:
        try:
            match = re.search(r"\{.*\}", text, re.DOTALL)
            if match:
                return json.loads(match.group())
        except Exception as e:
            debug_print(f"JSON extract error: {e}")
        return {}

    def determine_outcome(self, player_move: str, opponent_move: str) -> int:
        if player_move == opponent_move:
            return self.A if (player_move == self.FOOTBALL_MOVE) == (self.role == self.MAN_ROLE) else self.B
        return self.C

    def apply_strategy(self, opponent_move: str) -> (str, str, str):
        return "None", "None", "None"


    def update_score(self, outcome: int):
        self.player_score_game += outcome

    def get_history_summary(self) -> str:
        if not self.history:
            return "No previous rounds."
        lines = [
            f"Round {i + 1}: You chose {r['Agent Move']}, You predicted {r['Prediction']} and Opponent chose {r['Opponent Move']}. Round score: {r['Outcome']}"
            for i, r in enumerate(self.history)
        ]
        return "\n".join(lines) + f"\nTotal Playing Score: {self.player_score_game}\nCorrect Predictions: {self.prediction_score}/{len(self.history)}"

# Runner
async def main():
    total_rounds = 10
    game = BoS(
        model="qwen3",
        role=MAN,
        prediction=True,
        version="classic",
        temperature=0.7,
        game_id=1,
        opponent_strategy_fn=lambda history: OPERA if len(history) % 2 == 0 else FOOTBALL,
        strategy=False,
        total_rounds=total_rounds
    )
    for round_id in range(1, total_rounds + 1):
        await game.play_round(round_id)

    print(f"Final Score: {game.player_score_game}")
    print(f"Correct Predictions: {game.prediction_score}/{total_rounds}")
    accuracy = game.prediction_score / total_rounds * 100
    print(f"Prediction Accuracy: {accuracy:.1f}%")

if __name__ == "__main__":
    asyncio.run(main())