import random
import importlib.util
from utils.llm_service import client
import os
import shutil
from typing import List, Dict, Any, Callable
import json
import traceback
from Agent_block import AGENT_BLOCKS
from FlowGen import FlowGen

class FlowGenome:
    def __init__(self, task_info, tools: Dict[str, Callable]=None):
        """Initialize the FlowGenome class."""

        self.prompt_task = task_info
        self.strategies = {
            "1": "get_prompt_Exp1",
            "2": "get_prompt_Exp2",
            "3": "get_prompt_Exploit1",
            "4": "get_prompt_Exploit2",
            "5": "get_prompt_Exploit3"
        }
        self.tools = tools

        self.format_prompt = f"""
            NOTE:
            1.You need to implement it by instantiating the two existing basic Agent classes Actor(tool) and Verifier(). 
            2.You can obtain results by calling the process(prompt) method; Actor will return {{'result': str, 'observation': str}}; Verifier will return {{'is_valid': bool, 'evaluation': str}}. 
            3.Please use correct variable names and keys to ensure correct communication between Agents.
            4.Please use f-string formatting for the prompt to avoid key errors.
            5.If you need to use Verifier, there must be an Actor to fix the result according to the evaluation.
            6. The MultiAgentSystem class must have the following structure:
            def __init__(self, name: str, tools=None) -> None:
                self.name = name
                self.tools = tools
                ...
            def run(self, task: str): # Function name must be run; Must accept variable task.
                # Import necessary packages
                ...
                # Implement the agent flow here.
                ...
                # Must return the final answer to the task; Key name must be answer; Just need one solution.
                return {{"answer": str, ...}}
            
            """
        self.agent_blocks = f"7.You can use Agent_block_library to help you design Agent flow, here are the blocks: \n{AGENT_BLOCKS}\n"
        self.prompt_law = f"""
        Here are some principles for prompt design:
        1. You can use identity setting in the prompt to improve accuracy, such as "you are a mathematician, ..."
        2. It is also helpful to introduce a small number of examples about the task in the prompt.
        3. Special symbol designs can help the agent better understand the task.
        4. You can also try new innovations!

        """ 

    def get_prompt_Exp1(self, indivs):
        """create new agent flow from existing agent flows."""
        prompt_indiv = ""
        for i, indiv in enumerate(indivs):
            prompt_indiv += f"No.{i+1} agent flow and the corresponding code are:\n{indiv['code']} \n"
        prompt_content = (
            f"{self.prompt_task}\n"
            f"I have {len(indivs)} existing agent flow with their codes as follows:\n"
            f"{prompt_indiv}"
            "Please help me create a new agent flow that has a totally different form from the given ones in structure and prompts.\n"
            f"{self.format_prompt}"
            f"{self.agent_blocks}"
            "First, describe your new agent flow and main steps in one sentence. "
            "Then, please return the Python implementation of the MultiAgentSystem class in JSON format. "
            f"{{'plan': str, 'code': str, 'num_agent': int}}"
        )
        return prompt_content
    
    def get_prompt_Exploit1(self, indivs):
        """create new agent flow motivated by existing ones."""
        prompt_indiv = ""
        for i, indiv in enumerate(indivs):
            prompt_indiv += (
                f"No.{i+1} agent flow and the corresponding code are:\n{indiv['code']}\n"
            )
        prompt_content = (
            f"{self.prompt_task}\n"
            f"I have {len(indivs)} existing agent flows with their codes as follows:\n"
            f"{prompt_indiv}"
            "Please help me create a new agent flow that has a totally different form from the given ones but can be motivated from them.\n"
            f"{self.format_prompt}"
            f"{self.agent_blocks}"
            "Firstly, identify the common backbone idea in the provided agent flows. "
            "Secondly, based on the backbone idea describe your new agent flow in one sentence. "
            "The description must be inside a brace. Thirdly, implement it in Python as a function named "
            "Then, please return the Python implementation of the MultiAgentSystem class in JSON format. "
            f"{{'plan': str, 'code': str, 'num_agent': int}}"
        )
        return prompt_content
    
    def get_prompt_Exp2(self, indiv1):
        """modify one agent flow."""
        prompt_content = (
            f"{self.prompt_task}\n"
            "I have one agent flow with its code as follows. "
            f"agent flow description: {indiv1['plan']}\n"
            f"Code:\n{indiv1['code']}\n"
            "Please assist me in creating a new agent flow that has a different form but can be a modified version of the agent flow provided.\n"
            f"{self.format_prompt}"
            f"{self.agent_blocks}"
            "First, describe your new agent flow and main steps in one sentence. "
            "The description must be inside a brace. Next, implement it in Python as a function named "
            "Then, please return the Python implementation of the MultiAgentSystem class in JSON format. "
            f"{{'plan': str, 'code': str, 'num_agent': int}}"
        )
        return prompt_content
    
    def get_prompt_Exploit2(self, indiv1):
        """change prompt settings of one agent flow."""
        prompt_content = (
            f"{self.prompt_task}\n"
            "I have one agent flow with its code as follows. "
            f"agent flow description: {indiv1['plan']}\n"
            f"Code:\n{indiv1['code']}\n"
            "You are a prompt optimization master, please keep the agent flow structure unchanged, only optimize the corresponding prompt.\n"
            f"{self.prompt_law}"
            #f"{self.format_prompt}"
            #f"You cannot add or reduce the original number of agents: {indiv1['num_agent']}."
            "First, describe your main idea and main steps in one sentence. "
            "Then, please return the Python implementation of the MultiAgentSystem class in JSON format. "
            f"{{'plan': str, 'code': str, 'num_agent': int}}"
        )
        return prompt_content
    
    def get_prompt_Exploit3(self, indiv1):
        """simplify components to enhance generalization."""
        prompt_content = (
            f"{self.prompt_task}\n"
            "First, you need to identify the main components in the function below. "
            "Next, analyze whether any of these components can be overfit to the in-distribution instances. "
            "Then, based on your analysis, simplify the components to enhance the generalization to potential out-of-distribution instances. "
            "Finally, provide the revised code, keeping the function name, inputs, and outputs unchanged.\n"
            f"{indiv1['code']}\n"
            f"{self.format_prompt}"
            "Then, please return the Python implementation of the MultiAgentSystem class in JSON format. "
            f"{{'plan': str, 'code': str, 'num_agent': int}}"
        )
        return prompt_content


    def code_test(self, code):
        with open("flow_genome_tmp.py", "w") as f:
            f.write(code)
        try:
            importlib.util.spec_from_file_location("flow_genome_tmp", "flow_genome_tmp.py")
            flow_mod = importlib.util.module_from_spec(spec)
            spec.loader.exec_module(flow_mod)
            system = flow_mod.MultiAgentSystem("EvoTest")
            system.run(self.task_info)
            return True
        except Exception as e:
            print(f"Failed to run code: {e}")
            return False
    
    def evolve(self, strategy_type, parents, llm="gpt-4o-mini", debug=False):
        method_name = self.strategies.get(strategy_type)
        if not method_name or not hasattr(self, method_name):
            raise ValueError(f"Unknown or unimplemented prompt type: {strategy_type}")
        prompt_func = getattr(self, method_name)
        prompt = prompt_func(parents)

        response = client().chat.completions.create(
            model=llm,
            messages=[{"role": "system", "content": prompt}],
            response_format={"type": "json_object"}
        )
        result = response.choices[0].message.content
        result = json.loads(result)
        
        # 将result中的code写入.py文件检查其是否能成功运行
        if debug:
            return self.code_test(result["code"])

        return result


class EvoOptimizer:
    def __init__(self, task_info, tools=None, population_size=5, initial_population=None, llm="gpt-4o-mini" ):
        """初始化进化优化器
        
        Args:
            task_info: 任务描述信息
            population_size: 种群大小
            initial_population: 初始种群，如果为None则随机生成
            llm: 使用的大语言模型
        """
        self.task_info = task_info
        self.population_size = population_size
        self.llm = llm
        self.tools = tools
        self.flow_gen = FlowGen(task_info, tools)

        # 初始化种群
        if initial_population:
            self.population = initial_population
            self.population_size = len(initial_population)
            if self.population_size < population_size:
                for _ in range(population_size - self.population_size):
                    flow = self.flow_gen.generation()
                    self.population.append({
                        "code": flow["code"],
                        "plan": flow["plan"],
                        "num_agent": flow["num_agent"],
                        "fitness": -1  
                    })
        else:
            # 如果没有初始种群，创建随机种群
            self.population = []
            for _ in range(population_size):
                flow = self.flow_gen.generation()
                self.population.append({
                    "code": flow["code"],
                    "plan": flow["plan"],
                    "num_agent": flow["num_agent"],
                    "fitness": -1  
                })
        
        with open("ini_flow.json", "w", encoding="utf-8") as f:
            json.dump(self.population, f, ensure_ascii=False, indent=2)
        self.flow_evo = FlowGenome(task_info, tools=self.tools)
        
        # 策略及其使用概率
        self.strategies = list(self.flow_evo.strategies.keys()) # 对应不同的进化策略
        self.strategy_weights = [0.5, 0.5, 0.8, 0.8, 0.8]  # 各策略的使用概率
        

    def evaluate(self, individual, benchmark_type="gsm-8k", mode="train", difficulty=None, sample_size=None):
        """评估个体的适应度
        
        Args:
            individual: 待评估的个体
            benchmark_type: 基准测试类型
            mode: 评估模式
            difficulty: 难度级别（用于课程学习）
            sample_size: 样本大小（用于课程学习）
            
        Returns:
            float: 适应度分数
        """
        try:
            # 将代码写入临时文件
            with open("flow_genome_tmp.py", "w", encoding="utf-8") as f:
                f.write(individual["code"])
            
            # 动态导入
            spec = importlib.util.spec_from_file_location("flow_genome_tmp", "flow_genome_tmp.py")
            flow_mod = importlib.util.module_from_spec(spec)
            spec.loader.exec_module(flow_mod)
            
            # 创建系统并评测
            system = flow_mod.MultiAgentSystem("EvoTest", self.tools)
            
            # 如果有基准测试数据，使用它进行评估
            if benchmark_type == "gsm-8k":
                if difficulty and sample_size:
                    # 使用课程学习版本的评估
                    from Evaluation.Eval_GSM8k_Curriculum import Eval_Curriculum
                    return Eval_Curriculum(agentflow=system, difficulty=difficulty, sample_size=sample_size)
                else:
                    # 使用原版评估
                    from Evaluation.Eval_GSM8k import Eval
                    return Eval(agentflow=system, mode=mode, sample_size=sample_size)
            elif benchmark_type == "math":
                from Evaluation.Eval_MATH import Eval
                # MATH评估支持难度级别
                return Eval(agentflow=system, mode=mode, level=difficulty, sample_size=sample_size)
            else:
                return 0.0
                
        except Exception as e:
            print(f"评估失败: {e}")
            print(traceback.format_exc())
            return 0.0  # 执行失败的个体适应度为0
    
    def select_parents(self, fitnesses, num_parents=2):
        """使用轮盘赌选择父代
        
        Args:
            fitnesses: 适应度列表
            num_parents: 需要选择的父代数量
            
        Returns:
            list: 选中的父代索引列表
        """
        # 确保适应度非负
        min_fitness = min(fitnesses)
        if min_fitness < 0:
            adjusted_fitnesses = [f - min_fitness for f in fitnesses]
        else:
            adjusted_fitnesses = fitnesses
        
        # 计算总适应度
        total_fitness = sum(adjusted_fitnesses)
        if total_fitness == 0:  # 避免除零错误
            # 如果所有适应度都为0，则均等概率选择
            return random.sample(range(len(fitnesses)), num_parents)
        
        # 轮盘赌选择
        selected = []
        for _ in range(num_parents):  # 选择num_parents个父代
            pick = random.uniform(0, total_fitness)
            current = 0
            for i, f in enumerate(adjusted_fitnesses):
                current += f
                if current > pick:
                    selected.append(i)
                    break
            # 如果没有选中（浮点数精度问题），选择最后一个
            if len(selected) <= _:
                selected.append(len(fitnesses) - 1)
        
        return selected
    

    def evolve(self, generations=10, benchmark_type="gsm-8k"):
        """执行进化过程
        
        Args:
            generations: 进化代数
            benchmark_type: 基准测试类型
            
        Returns:
            dict: 最佳个体
        """
        best_individual = None
        best_fitness = -1
        
        # 创建结果目录
        os.makedirs("results/history", exist_ok=True)
        
        for generation in range(generations):
            print(f"\n===== 第 {generation+1}/{generations} 代 =====")
            
            # 评估当前种群
            fitnesses = []
            for i, individual in enumerate(self.population):
                # 如果个体已经评估过，直接使用
                if individual["fitness"] == -1:
                    # 评估个体
                    fitness = self.evaluate(individual, benchmark_type)
                    self.population[i]["fitness"] = fitness

                else:
                    fitness = individual["fitness"]

                fitnesses.append(fitness)

                # 更新最佳个体
                if fitness > best_fitness:
                    best_fitness = fitness
                    best_individual = individual.copy()
            
            # 打印当前代的信息
            avg_fitness = sum(fitnesses) / len(fitnesses) if fitnesses else 0
            print(f"平均适应度: {avg_fitness:.4f}, 最佳适应度: {max(fitnesses):.4f}")
            
            # 如果已经是最后一代，则不需要创建新种群
            if generation == generations - 1:
                break
            
            # 操作符驱动的进化过程
            n_strategy = len(self.strategies)
            new_population = []
            
            # 精英保留 - 保留最佳个体
            best_idx = fitnesses.index(max(fitnesses))
            new_population.append(self.population[best_idx].copy())
            
            # 对每个操作符应用进化
            for i in range(n_strategy):
                strategy = self.strategies[i]
                print(f" Strategy: {strategy}, [{i + 1} / {n_strategy}] ", end="|")
                strategy_w = self.strategy_weights[i]
                
                # 根据权重决定是否使用该操作符
                if (random.random() < strategy_w):
                    
                    # 如果需要多个个体进行进化
                    if strategy == "1" or strategy == "3": 
                        parents = self.select_parents(fitnesses, 2)
                        result = self.flow_evo.evolve(strategy, [self.population[i] for i in parents])
                        fitness = self.evaluate(result)
                    else: #用最佳个体进行进化
                        result = self.flow_evo.evolve(strategy, self.population[best_idx])
                        fitness = self.evaluate(result)


                    if "code" in result and "plan" in result:
                        offspring = {
                            "code": result["code"],
                            "plan": result["plan"],
                            "num_agent": result["num_agent"],
                            "fitness": fitness
                        }
                        
                        new_population.append(offspring)
                   
                        # 保存进化历史
                        history_data = {
                            "parents": parents,
                            "offspring": offspring,
                            "operator": strategy
                        }
                        with open(f"results/history/gen_{generation+1}_strategy_{strategy}.json", "w", encoding="utf-8") as f:
                            json.dump(history_data, f, ensure_ascii=False, indent=2)
                
                # 种群管理 - 确保种群大小不超过限制
                while len(new_population) > self.population_size:
                    # 移除适应度最低的个体
                    min_fitness_idx = 0
                    min_fitness = float('inf')
                    for i, ind in enumerate(new_population):
                        if ind.get("fitness", 0) < min_fitness:
                            min_fitness = ind.get("fitness", 0)
                            min_fitness_idx = i
                    new_population.pop(min_fitness_idx)
                
            
            # 如果新种群数量不足，从原种群中补充
            while len(new_population) < self.population_size:
                # 使用轮盘赌选择
                idx = self.select_parents(fitnesses)[0]
                new_population.append(self.population[idx].copy())
            
            # 更新种群
            self.population = new_population
            
            # 保存当前代的种群
            with open(f"results/gen_{generation+1}_population.json", "w", encoding="utf-8") as f:
                json.dump(self.population, f, ensure_ascii=False, indent=2)
             
        # 返回最佳个体
        return best_individual


    
