import os
import time
from utils.extractors import *
from utils.runners import execute_code
import requests
import pandas as pd
from prompts.base_agent_prompts import *
import subprocess
import sys


class BaseAgent_openai:
    def __init__(self, config, agent_name, debug_logger, main_logger,
                 sub_logger, checker=None, rag_agent=None):
        self.url = config['URL']

        self.instructions = ''
        self.agent_name = agent_name
        self.model_name = config['model_name']
        self.api_key = config['api_key']
        self.main_logger = main_logger
        self.sub_logger = sub_logger
        self.debug_logger = debug_logger
        self.checker = checker
        self.config = config
        self.context = []

    def add_message_to_context(self, role, content):
        """Adds a message from a user or an agent's response to the context information"""
        self.context.append({"role": role, "content": content})

    def clear_context(self):
        """Reinitialized the context information array"""
        self.context = []

    def install_packages(self, error):
        """Installs missing libraries based on error code"""
        self.clear_context()
        self.instructions = INSTALL_PACKAGES_PROMPT.format(error=error)
        code = extract_code(self.generate_response(''))
        parts = code.strip().split()
        if parts[0] in ('pip', 'pip3'):
            packages = parts[2:]
        else:
            packages = [p for p in parts if not p.startswith('-')]
        subprocess.check_call([sys.executable, "-m", "pip", "install", *packages])

    def write_running_time(self, start_work):
        end_work = time.time()
        times_path = os.path.join(self.config["path_debug_log"], "times.csv")
        times_df = pd.read_csv(times_path)
        seconds = round(end_work - start_work)
        new_row = {
            'agent': self.agent_name,
            'running_time_in_seconds': seconds,
            "running_time_in_minutes": seconds // 60
        }
        times_df = pd.concat([times_df, pd.DataFrame([new_row])], ignore_index=True)
        times_df.to_csv(times_path, index=False)

    def code_generation_from_several_attempts(self, number_of_attempts: int,
                                              need_extract_code: bool = False, need_execute: bool = False,
                                              input_text: str = '', filename_to_save: str | None = None,
                                              **params):
        """
        Generate a response from LLM with further verification of the result,
        in particular through the Checker, if necessary

        :param number_of_attempts: number of attempts allowed for correct response generation
        :param need_extract_code: (bool) should the agent issue python code?
        :param need_execute: (bool) is it necessary to check the code for executability?
        :param input_text: additional text in addition to the instructions
        :param filename_to_save: file name for saving the code
        :param params: other parameters, in particular images for context, stage name, etc.
        :return:
        """
        if "need_checker" not in params:
            need_checker = self.agent_name in self.config['agents_for_checker']
        else:
            need_checker = params["need_checker"]

        if "log_prefix" in params:
            log_prefix = f' {params["log_prefix"]}'
        else:
            log_prefix = ""

        need_clear = need_checker
        for attempt in range(number_of_attempts):
            if not need_clear:
                # The context of previous launches is only necessary for further verification by the checker
                self.clear_context()
            self.sub_logger.info(
                f"⬛{log_prefix} {self.agent_name.title()} Attempt: {attempt + 1}/{number_of_attempts}")

            images = None if "images" not in params else params['images']
            result = self.generate_response(input_text, images=images)
            if need_extract_code:
                result = extract_python_code(result)
            if result:
                # If no additional verification from the checker is required,
                # we consider the result to be generated correctly

                # Else, perform a check using a checker
                if need_checker:
                    if need_execute:
                        filepath = self.save_code_to_file(result, filename_to_save)
                        code_output, error = execute_code(filepath, self.config["path_debug_log"], self.agent_name)
                        if error is not None:
                            error_title = extract_error_title(error)
                            self.sub_logger.info(f"Errors occurred while running the code:\n{error_title}")
                            self.add_message_to_context("user", error_title)
                            continue

                    match self.agent_name:
                        case "validator":
                            # Manually check for the presence of files that needed to be created
                            are_the_files_created = True
                            for file in ['train.csv', 'test.csv', 'test_submit.csv']:
                                if not os.path.exists(os.path.join(self.config['save_path'], file)):
                                    are_the_files_created = False
                                    break
                            is_it_correct, description = self.checker.check_the_code_for_correctness(
                                self.agent_name,
                                result,
                                are_the_files_created=are_the_files_created,
                                save_path=self.config['save_path'],
                                path_to_data=self.config['data_dir_path']
                            )
                        case 'scorer':
                            code = extract_python_code(result)
                            mode_scoring_json = extract_json(result)

                            got_a_code = bool(code is not None)
                            error = NO_ERROR_WITHOUT_CODE
                            if got_a_code:
                                filepath = self.save_code_to_file(code, 'evaluation.py')
                                sample_submission_path = os.path.join(self.config['save_path'], 'test_submit.csv')
                                _, error = execute_code(
                                    filepath, self.config["path_debug_log"], "scorer",
                                    args=["--test_path", sample_submission_path, "--predict_path",
                                          sample_submission_path]
                                )
                                if error is not None:
                                    self.sub_logger.info(
                                        f"Errors occurred while running the code from scorer on sample submission:\n{error}"
                                    )
                            # Checking the correctness of the generated JSON
                            got_a_json = bool(mode_scoring_json is not None)
                            got_a_keys = False  # Is there a “mode” key in json?
                            got_a_mode_scoring = False  # Are the mode values in that correct range?
                            if got_a_json:
                                got_a_keys = bool('is_higher_better' in mode_scoring_json)
                                mode_scoring = mode_scoring_json['is_higher_better']
                                got_a_mode_scoring = isinstance(mode_scoring, bool)

                            is_it_correct, description = self.checker.check_the_code_for_correctness(
                                self.agent_name,
                                result,
                                got_a_code=got_a_code,
                                got_a_json=got_a_json,
                                got_a_keys=got_a_keys,
                                got_a_mode_scoring=got_a_mode_scoring,
                                error=error
                            )
                        case "insighter":
                            insights_json = extract_json(result)

                            # We manually check the correctness of json and
                            # whether the number of ideas corresponds to the requested number
                            got_a_json = bool(insights_json is not None)
                            ideas_match_config = False
                            if got_a_json:
                                ideas_match_config = bool(len(insights_json['insights']) == params['number_of_ideas'])

                            is_it_correct, description = self.checker.check_the_code_for_correctness(
                                self.agent_name,
                                agent_output=result,
                                number_of_ideas=params['number_of_ideas'],
                                got_a_json=got_a_json,
                                ideas_match_config=ideas_match_config,
                                task_name=params['task_name']
                            )
                        case "coder":
                            # Performs verification of the generated code for compliance with stage requirements
                            match params['task_name']:
                                case "Model training":
                                    is_it_correct, description = self.checker.check_the_code_for_correctness(
                                        self.agent_name,
                                        result,
                                        task_name=params['task_name'],
                                        idea=params['idea'],
                                        node_index=params["node_index"],
                                        parent_index=params["parent_index"],
                                    )
                                case "Data preparation and feature engineering":
                                    is_it_correct, description = self.checker.check_the_code_for_correctness(
                                        self.agent_name,
                                        result,
                                        task_name=params['task_name'],
                                        idea=params['idea'],
                                        node_index=params["node_index"]
                                    )
                                case _:
                                    raise KeyError(f"{params['task_name']} not found")
                        case _:
                            raise KeyError(f"Agent {self.agent_name} not found in Checker")

                    if not is_it_correct:
                        self.add_message_to_context("user", description)
                        continue
                    self.sub_logger.info("✅ Checker approved")
                elif need_execute:
                    filepath = self.save_code_to_file(result, filename_to_save)
                    code_output, error = execute_code(filepath, self.config["path_debug_log"], self.agent_name)
                    if error is not None:
                        error_title = extract_error_title(error)
                        self.sub_logger.info(f"Errors occurred while running the code:\n{error_title}")
                        self.add_message_to_context("user", error_title)
                        need_clear = False
                        continue

                return result
            else:
                self.sub_logger.info(
                    "Unable to obtain agent output (result is empty), "
                    "switching API key"
                )
                self.api_key = next(self.config['api_keys'])
        else:
            return None

    def generate_response(self, user_input: str = '', images: list | None = None) -> str:
        """
        Function for generating a response from LLM.

        :param user_input: additional text to the instructions
        :param images: images that must be in context
        :return: generated response (string)
        """
        if user_input:
            self.add_message_to_context("user", user_input)

        messages = []
        if self.instructions:
            messages.append({"role": "user", "content": self.instructions})
        for msg in self.context:
            role = msg["role"]
            messages.append({"role": role, "content": msg["content"] + ' '})

        messages_for_debug = messages.copy()  # to ignore images when outputting to debug logs
        if images is not None:
            image_entries = [{"role": "user", "content": img} for img in images]
            messages.extend(image_entries)
            # Consume images only once
            images = None

        response_text = ''
        response = {}

        while not response_text:
            self.debug_logger.info(
                f'{self.config["model_name"]}, {self.api_key}, {self.url}'
            )

            data = {
                "timeout": self.config['timeout'],
                "api_key": self.api_key,
                "model_name": self.config["model_name"],
                "content": messages,
            }

            if 'model_type' in self.config:
                data['model_type'] = self.config['model_type']

            try:
                response = requests.post(self.url, json=data, timeout=self.config['timeout'])
                response = response.json()
            except requests.exceptions.Timeout:
                self.api_key = next(self.config['api_keys'])
                self.config['api_key'] = self.api_key
                # self.url = next(self.config["URLS"])
                self.main_logger.info("Request timeout, switching API key")
                continue
            except Exception as e:
                self.api_key = next(self.config['api_keys'])
                self.config['api_key'] = self.api_key
                # self.url = next(self.config["URLS"])
                self.main_logger.info(f"JSON decode or network error: {e}")
                continue

            if response.get('status') == 'error':
                error = response.get('error', '')
                if error == 'Timeout':
                    self.api_key = next(self.config['api_keys'])
                    self.config['api_key'] = self.api_key
                    # self.url = next(self.config["URLS"])
                    self.main_logger.info("Request timeout, switching API key")
                    continue
                elif error == "InternalServerError":
                    self.main_logger.info("Internal server error")
                    continue
                try:
                    retry_delay = extract_retry_delay(str(error))
                except ValueError:
                    retry_delay = 60
                if not isinstance(retry_delay, int):
                    retry_delay = 60

                self.api_key = next(self.config['api_keys'])
                self.config['api_key'] = self.api_key
                # self.url = next(self.config["URLS"])
                self.main_logger.info(f"Quota error. Switch API key")

                # Uncomment if needed
                # retry_delay = 5
                # self.main_logger.info(f"Sleep {retry_delay} seconds")
                # time.sleep(retry_delay)
                continue

            response_text = response['text']
            break

        response_text = str(response_text)
        self.add_message_to_context("assistant", response_text)

        # Debug логи
        messages_for_debug.append({"role": "assistant", "content": response_text + ' '})
        self.debug_logger.info(f'Agent: {self.agent_name}')
        for message in messages_for_debug:
            emoji = "👨" if message['role'] == 'user' else "💻"
            self.debug_logger.info(f"{emoji} role: {message['role']}")
            self.debug_logger.error(f"🔊 content: {message['content']}")

        if "input_tokens" in response:
            try:
                tokens_path = os.path.join(self.config["path_debug_log"], "tokens.csv")
                tokens_df = pd.read_csv(tokens_path)
                new_row = {
                    'agent': self.agent_name,
                    'input_tokens': response["input_tokens"],
                    'output_tokens': response["output_tokens"]
                }
                tokens_df = pd.concat([tokens_df, pd.DataFrame([new_row])], ignore_index=True)
                tokens_df.to_csv(tokens_path, index=False)
            except Exception as e:
                self.main_logger.error(f"Token logging failed: {e}")

        return response_text

    def save_code_to_file(self, code: str, filename: str, pre_path: str = 'code', need_save: bool = True):
        """
        Create a file and save the code there or just return file path

        :param code: python code that needs to be saved to a file
        :param filename: the name of the file to be created and in which the code should be written
        :param pre_path: relative path to the file location
        :param need_save: Should I save or just return the path to the file?
        :return: file_path - absolute path to the saved file
        """
        if pre_path:
            path_to_save = os.path.join(self.config['path_log'], pre_path)
        else:
            path_to_save = self.config['path_log']
        try:
            os.makedirs(path_to_save, exist_ok=True)
        except Exception as e:
            raise f"Error creating directory: {e}"

        file_path = os.path.join(path_to_save, filename)
        if need_save:
            with open(file_path, "w", encoding="utf-8") as file:
                file.write(code)

        return file_path