from agents.base_agent import BaseAgent_openai
from prompts.validator_agent_prompts import *
from utils.utils import move_file_to_log_dir
from utils.runners import execute_code
from utils.extractors import extract_json
import os
import pandas as pd
import shutil


class ValidatorAPI(BaseAgent_openai):
    def test_train_split(self):
        """
        Split the training sample into test and training samples.

        :return: error/None, validator_filepath/None
        """
        self.clear_context()

        path_to_data = self.config['data_dir_path']
        with open(self.config['background_data_path'], 'r') as f:
            data_description = f.read()

        path_to_sample_submission = os.path.join(self.config['data_dir_path'], "sample_submission.csv")
        sample_submission_head = pd.read_csv(path_to_sample_submission)
        train = pd.read_csv(os.path.join(self.config['data_dir_path'], "train.csv"))

        if self.config["need_pro_validator"]:
            # 1. Get more information about the data
            self.instructions = VALIDATOR_INFO_PROMPT.format(
                path_to_data=path_to_data,
                data_description=data_description,
                save_path=self.config['save_path'],
                sample_submission_head=sample_submission_head
            )
            code_get_info = self.code_generation_from_several_attempts(
                self.config['number_of_attempts_validator'],
                filename_to_save='validator_get_info.py',
                need_extract_code=True,
                need_execute=True,
                need_checker=False,
                log_prefix="GET_INFO"
            )
            validator_get_info_filepath = self.save_code_to_file(code_get_info, 'validator_get_info.py',
                                                                 need_save=False)
            if code_get_info is None:
                info_about_data = WITHOUT_RECOMMENDATION_TEXT
            else:
                info_about_data, error = execute_code(
                    validator_get_info_filepath, self.config["path_debug_log"], self.agent_name
                )
                if error is not None:
                    info_about_data = WITHOUT_RECOMMENDATION_TEXT

            # 2. Analysis
            self.clear_context()
            if info_about_data != WITHOUT_RECOMMENDATION_TEXT:
                self.instructions = VALIDATOR_ANALYZER_PROMPT.format(
                    info_about_data=info_about_data
                )
                recommendations_json = extract_json(self.generate_response())
                if isinstance(recommendations_json, dict) and "recommendations" in recommendations_json:
                    recommendations = str(recommendations_json["recommendations"])
                else:
                    recommendations = WITHOUT_RECOMMENDATION_TEXT
            else:
                recommendations = WITHOUT_RECOMMENDATION_TEXT

            recommendations += f"\nI'll give you the size of the training sample: (rows, columns) {train.shape}"
        else:
            recommendations = WITHOUT_RECOMMENDATION_TEXT

        recommendations += f"\nI'll give you the size of the training sample: (rows, columns) {train.shape}"

        # 3. Data split
        self.clear_context()
        self.instructions = VALIDATOR_SPLIT_PROMPT.format(
            path_to_data=path_to_data,
            save_path=self.config['save_path'],
            data_description=data_description,
            sample_submission_head=sample_submission_head,
            recommendations=recommendations,
            subset_size_in_percent=self.config["subset_size_in_percent"],
            size_threshold=self.config["validator_size_threshold"],
            path_to_sample_submission=path_to_sample_submission
        )
        move_file_to_log_dir(
            competition_dir=self.config['data_dir_path'],
            log_dir=self.config['save_path']
        )
        code = self.code_generation_from_several_attempts(
            self.config['number_of_attempts_validator'],
            filename_to_save='validator.py',
            need_extract_code=True, need_execute=True,
            log_prefix="SPLITTING"
        )
        if code is None:
            return f"The validator was unable to generate the code", None

        shutil.copy2(
            os.path.join(self.config['save_path'], "test_submit.csv"),
            os.path.join(self.config['save_path'], "sample_submission.csv")
        )
        validator_filepath = self.save_code_to_file(code, 'validator.py', need_save=False)
        return None, validator_filepath
