import os
import asyncio
import csv
import random
import re
import json
import requests
import boto3
from typing import Dict, Literal, List, Callable
from pydantic import BaseModel, ValidationError
from autogen_agentchat.agents import AssistantAgent
from autogen_agentchat.messages import TextMessage
from autogen_core import CancellationToken
from autogen_ext.models.openai import OpenAIChatCompletionClient

# Load API keys from environment variables
###################
#OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
OPENAI_API_KEY = "cle"
###################
#PAGODA_API_KEY = os.getenv("PAGODA_API_KEY")
PAGODA_API_KEY = "cle"
###################
AWS_ACCESS_KEY_ID = "cle"
AWS_SECRET_ACCESS_KEY = "cle"

if not OPENAI_API_KEY:
    raise ValueError("Missing OPENAI_API_KEY. Set it as an environment variable.")
if not PAGODA_API_KEY:
    raise ValueError("Missing PAGODA_API_KEY. Set it as an environment variable.")
if not AWS_ACCESS_KEY_ID:
    raise ValueError("Missing AWS_ACCESS_KEY_ID. Set it as an environment variable.")

CSV_FILE_PATH = "../../data/mp/mp_claude37.csv"

# Define the expected response format as a Pydantic model
class AgentResponse(BaseModel):
    move: Literal["Head", "Tail"]
    prediction: Literal["Head", "Tail", "None"]
    reasoning: str


class MP:
    def __init__(self, model: str, prediction: bool, temperature: float, game_id: int, opponent_strategy_fn: Callable[[List[Dict]], str], strategy=False, max_retries: int = 3):
        self.model = model
        self.temperature = temperature
        self.game_id = game_id
        self.strategy = strategy
        self.max_retries = max_retries
        self.history: List[Dict] = []
        self.player_score_game = 0
        self.opponent_strategy_fn = opponent_strategy_fn
        self.prediction = prediction
        self.prediction_score = 0

        is_openai_model = model.startswith("gpt")
        is_claude_model = model.startswith("aws-claude")
        is_pagoda_model = ":" in model

        self.base_url = (
            "https://api.openai.com/v1" if is_openai_model else
            "https://ollama-ui.pagoda.liris.cnrs.fr/ollama/api/generate" if is_pagoda_model else
            "http://localhost:11434/v1"
        )
        if is_claude_model:
            self.bedrock_client = boto3.client("bedrock-runtime", region_name="eu-west-3")
            if model == "aws-claude-3-haiku":
                self.bedrock_model_id = "eu.anthropic.claude-3-haiku-20240307-v1:0"
            elif model == "aws-claude-3-5-sonnet":
                self.bedrock_model_id = "eu.anthropic.claude-3-5-sonnet-20240620-v1:0"
            else:
                self.bedrock_model_id = "eu.anthropic.claude-3-7-sonnet-20250219-v1:0"

        model_info = {
            "temperature": self.temperature,
            "function_calling": True,
            "parallel_tool_calls": True,
            "family": "unknown",
            "json_output": True,
            "structured_output": True,
            "vision": False
        }

        self.model_client = OpenAIChatCompletionClient(
            timeout=60,
            model=self.model,
            base_url=self.base_url,
            api_key=OPENAI_API_KEY,
            model_info=model_info,
            response_format=AgentResponse
        )

    async def play_round(self, round_id: int, nb_rounds: int) -> Dict:
        opponent_move = self.opponent_strategy_fn(self.history)
        if self.strategy:
            move, prediction, reasoning = self.apply_strategy()
        else:
            move, prediction, reasoning = await self.model_based_prediction(round_id, nb_rounds)

        outcome = self.determine_winner(move, opponent_move)
        self.update_score(outcome)

        prediction_current_score = 0.0
        if self.prediction and prediction in ["Head", "Tail"]:
            if prediction == opponent_move:
                prediction_current_score = 1.0
                self.prediction_score += 1

        round_result = {
            "Your Move": move,
            "Prediction": prediction,
            "Opponent Move": opponent_move,
            "Reasoning": reasoning,
            "Outcome": outcome,
            "Current Player Prediction Score Game": self.prediction_score,
            "PredictionOutcome": prediction_current_score

        }
        self.history.append(round_result)
        print(f"Round {round_id} : {round_result}")
        return round_result

    async def model_based_prediction(self, round_id, nb_rounds) -> Dict:
        history_summary = self.get_history_summary()
        instruction = f"""
        You are playing to Matching pennies.
        There are two players: you and an opponent.
        In each round, both secretly choose, at the same time, “Heads” or “Tails”.
        If both choices are the same (make the same choice as your opponent), you gain 1 point and the opponent loses 1 point.
        If the choices are different (make the opposite choice of your opponent), the opponent gains 1 point and you lose 1 point.
        Your goal: Maximize your total gain over {nb_rounds} rounds.

        We are at round number {round_id}.
        Here is the complete game history of moves (yours and your opponent’s) and the current score:
        {history_summary}
        Use this history to try to predict the next opponent's move (whether it is random, pattern-based, or strategic).
        And use this history and your prediction to choose your next move ("Head" or "Tail") in order to maximize your total gain.
        """

        if not self.prediction:
            instruction += """
                        Respond ONLY with JSON format: {{
                            "move": "Head" | "Tail",
                            "prediction": "None",
                            "reasoning": "Explain your decision based on your preferences and the past moves"
                        }}
                        """
        else:
            instruction += """
                        Respond ONLY with JSON format: {{
                            "move": "Head" | "Tail",
                            "prediction": "Head" | "Tail",
                            "reasoning": "Explain how you predicted the opponent's move and how you chose your response"
                        }}
                        """

        if ":" in self.model:  # Pagoda
            return await self.run_pagoda(instruction)

        if self.model.startswith("aws-claude"):
            return await self.run_aws_claude(instruction)

        for attempt in range(1, self.max_retries + 1):
            agent = AssistantAgent(
                name="Player",
                model_client=self.model_client,
                system_message="You are a helpful assistant."
            )
            response = await agent.on_messages(
                [TextMessage(content=instruction, source="user")],
                cancellation_token=CancellationToken(),
            )
            try:
                response_data = response.chat_message.content
                agent_response = AgentResponse.model_validate_json(response_data)
                return agent_response.move, agent_response.prediction, agent_response.reasoning
            except (ValidationError, json.JSONDecodeError) as e:
                print(f"Attempt {attempt}: Failed to parse model response. Error: {e}")
        raise ValueError("Model failed to provide a valid response after multiple attempts.")

    async def run_pagoda(self, instruction: str):
        headers = {
            "Authorization": f"Bearer {PAGODA_API_KEY}",
            "Content-Type": "application/json"
        }
        payload = {
            "model": self.model,
            "temperature": self.temperature,
            "prompt": instruction,
            "stream": False
        }

        for attempt in range(self.max_retries):
            try:
                response = requests.post(self.base_url, headers=headers, json=payload)
                response.raise_for_status()
                response_data = response.json()
                raw_response = response_data.get("response", "")
                parsed_json = self.extract_json_from_response(raw_response)

                if not parsed_json:
                    print(f"Attempt {attempt+1}: Could not parse JSON - Raw response: {raw_response}")
                    continue

                agent_response = AgentResponse(**parsed_json)
                if agent_response.move in ["Head", "Tail"]:
                    return agent_response.move, agent_response.prediction, agent_response.reasoning
            except Exception as e:
                print(f"Attempt {attempt+1}: Error in run_pagoda - {e}")
        raise ValueError("run_pagoda failed to get a valid response.")

    async def run_aws_claude(self, instruction: str):
        import json
        body = json.dumps({
            "anthropic_version": "bedrock-2023-05-31",
            "max_tokens": 1024,
            "temperature": self.temperature,
            "messages": [
                {
                    "role": "user",
                    "content": [
                        {"type": "text", "text": instruction}
                    ]
                }
            ]
        })
        response = self.bedrock_client.invoke_model(
            modelId=self.bedrock_model_id,
            contentType="application/json",
            accept="application/json",
            body=body
        )
        resp_json = json.loads(response["body"].read())
        # Le texte est dans resp_json["output_text"] ou resp_json["content"][0]["text"] selon la version
        raw_text = resp_json["content"][0]["text"]
        parsed_json = self.extract_json_from_response(raw_text)
        agent_response = AgentResponse(**parsed_json)
        return agent_response.move, agent_response.prediction, agent_response.reasoning

    def extract_json_from_response(self, text: str) -> dict:
        try:
            json_str = re.search(r"\{.*\}", text, re.DOTALL)
            if json_str:
                return json.loads(json_str.group())
        except Exception as e:
            print(f"Error extracting JSON: {e}")
        return {}

    def apply_strategy(self):
        """Play the next move using a heuristic."""
        prediction = ""
        print(self.model)
        if self.model == "gpt-4.5-preview-2025-02-27":
            moves = ["Head", "Tail"]
            # If no rounds played, start with "Head"
            if not self.history:
                move = "Head"
                prediction = "Tail" if self.prediction else "None"
                reasoning = (
                        "First round, no history. Starting with 'Head'. "
                        + (f"Predicting opponent starts with 'Tail' (alternating)." if self.prediction else "")
                )
                return move, prediction, reasoning
            # Get last move you played and the opponent's last move
            last_agent_move = self.history[-1]["Your Move"]
            last_opponent_move = self.history[-1]["Opponent Move"]
            # Alternate your move from last time
            move = "Tail" if last_agent_move == "Head" else "Head"
            # Prediction: Suppose opponent is also alternating
            if self.prediction:
                prediction = "Tail" if last_opponent_move == "Head" else "Head"
            else:
                prediction = "None"
            reasoning = (
                    f"Last round I played {last_agent_move}, opponent played {last_opponent_move}. "
                    f"I'm alternating my move to '{move}'. "
                    + (
                        f"Predicting opponent will alternate to '{prediction}'."
                        if self.prediction else "No prediction mode."
                    )
            )
            return move, prediction, reasoning
        if self.model == "mistral-small":
            if not self.history:
                # If there is no history yet, play randomly.
                moves = ["Head", "Tail"]
                return random.choice(moves), f"First round, choosing {random.choice(moves)}."
            head_count = 0
            tail_count = 0
            for move in [r['Opponent Move'] for r in self.history]:
                if move == 'Head':
                    head_count += 1
                elif move == 'Tail':
                    tail_count += 1
            # If there are more heads, play Tail and vice versa.
            if head_count > tail_count:
                next_move = "Tail"
            elif tail_count > head_count:
                next_move = "Head"
            else:  # Equal counts
                moves = ["Head", "Tail"]
                next_move = random.choice(moves)
            reasoning = f"Opponent's 'Head' count: {head_count}, 'Tail' count: {tail_count}. Chose to play '{next_move}' based on the opponent's move frequency."
            return next_move, "None", reasoning
        if self.model == "qwen3":
            move = random.choice(["Head", "Tail"])
            prediction = move  # Assume the opponent will match our move
            reasoning = f"Choosing randomly. Assuming the opponent will match my move {move}."
            return move, prediction, reasoning
        return "None", "None", "None"

    @staticmethod
    def determine_winner(player_move: str, opponent_move: str) -> int:
        if player_move == "None":
            return 0
        if player_move == opponent_move:
            return 1  # Win
        else:
            return -1  # Loss

    # Sample opponent strategy
    def alternative_opponent_strategy(history):
        moves = ["Head", "Tail"]
        return moves[len(history) % len(moves)]

    def update_score(self, outcome: int):
        """Updates the score based on the outcome."""
        self.player_score_game += outcome

    def get_history_summary(self) -> str:
        if not self.history:
            return "This is the first round, there is no history."
        summary = "\n".join(
            [
                f"Round {i + 1}: You played {r['Your Move']}, Opponent played {r['Opponent Move']}. Outcome: {r['Outcome']}"
                for i, r in enumerate(self.history)]
        )
        summary += f"\nCurrent Score - You: {self.player_score_game}\nCorrect Predictions: {self.prediction_score}/{len(self.history)}"
        return summary


# Runner
async def main():
    game = MP(
        model="aws-claude-3-7-sonnet",     # "gpt-4.1", "aws-claude-3-7-sonnet", "aws-claude-3-5-sonnet", "aws-claude-3-haiku", "qwen3", "llama3", "llama3.3", "mixtral", "mistral-small", "deepseek-r1"
        temperature=0,
        game_id=1,
        prediction=True,
        opponent_strategy_fn=lambda history: "Tail" if len(history) % 2 == 0 else "Head",
        strategy=False  # or True for rule-based
    )
    num_rounds = 10
    for round_id in range(1, num_rounds + 1):
        await game.play_round(round_id, num_rounds)

    print(f"Final Score: {game.player_score_game}")
    print(f"Correct Predictions: {game.prediction_score}/{num_rounds}")
    accuracy = game.prediction_score / num_rounds * 100
    print(f"Prediction Accuracy: {accuracy:.1f}%")

if __name__ == "__main__":
    asyncio.run(main())
