import json

from agents.baseline_agent import BaselinerAPI
from agents.debug_agent import DebugAgentAPI
from agents.insight_agent import InsightAgentAPI
from agents.reader_agent import ReaderAgentAPI
from agents.validator_agent import ValidatorAPI
from agents.scorer_agent import ScorerAPI
from agents.code_agent import CodeAgentAPI
from agents.checker_agent import CheckerAPI
from agents.estimate_agent import EstimateAgent
from agents.rag_agent import RagAgentAPI
from agents.reasoner_agent import ReasonerAPI
from algorithms.adding import Adding_algorithms
from algorithms.merging import MergingManager

from utils.arxiv_parser import parse_arxiv
from utils.kaggle_parser import parse_kaggle
from sentence_transformers import SentenceTransformer
import time
from utils.utils import replace_dirs, write_running_time
from utils.runners import execute_code
from utils.extractors import extract_python_code
from utils.generate_graphs import generate_all_plots
from collections import defaultdict
import os
import torch, gc


class Pipeline:
    def __init__(self, config, start_time, main_logger, sub_logger, debug_logger):
        self.config = config
        self.main_logger = main_logger
        self.sub_logger = sub_logger
        self.debug_logger = debug_logger
        self.phases = self.config['phases']
        self.state = 'read'
        self.start_time = start_time
        self.rag_agent = None

        self.baseline_score: int | None = None
        self.previous_ideas: list | None = None
        self.background_data: str | None = None
        self.eda_output: str = ''
        self.eda_images: list = []
        self.is_higher_better: bool | None = None

        # An array of nodes in the final stages from which backpropagation will be launched
        self.node_scores: list = []

        # Array of ideas:
        #   1. According to which the metric is calculated on the validation sample
        #   2. The metric of which is submitted to the “estimate_agent” agent
        self.complex_ideas_with_score: None | list = None

        # One idea that is submitted to the “estimate_agent” in order to show how it affects the metric
        self.cross_dataset_idea: str | None = None

        self.checker = CheckerAPI(
            config=config, agent_name='checker',
            debug_logger=debug_logger, main_logger=main_logger, sub_logger=sub_logger
        )
        self.reader = ReaderAgentAPI(
            config=config, agent_name='reader', checker=self.checker,
            debug_logger=debug_logger, main_logger=main_logger, sub_logger=sub_logger
        )
        self.scorer = ScorerAPI(
            config=config, agent_name='scorer', checker=self.checker,
            debug_logger=debug_logger, main_logger=main_logger, sub_logger=sub_logger
        )
        self.validator = ValidatorAPI(
            config=config, agent_name='validator', checker=self.checker,
            debug_logger=debug_logger, main_logger=main_logger, sub_logger=sub_logger
        )
        self.baseliner = BaselinerAPI(
            config=config, agent_name='baseliner', checker=self.checker,
            main_logger=main_logger, sub_logger=sub_logger, debug_logger=debug_logger
        )
        self.debugger = DebugAgentAPI(
            config=config, agent_name='debugger', scorer=self.scorer, checker=self.checker,
            main_logger=main_logger, sub_logger=sub_logger, debug_logger=debug_logger,
        )
        self.reasoner = ReasonerAPI(
            config=config, agent_name='reasoner',
            debug_logger=debug_logger, main_logger=main_logger, sub_logger=sub_logger
        )

        if self.config['use_rag']:
            self.rag_agent = RagAgentAPI(
                config=config, agent_name='rag_agent', main_logger=main_logger,
                sub_logger=sub_logger, debug_logger=debug_logger
            )

        # Agents and algorithms will be initialized in the "start" function of the pipeline
        self.coder: CodeAgentAPI
        self.insighter: InsightAgentAPI
        self.estimator: EstimateAgent
        self.merging_algorithm: MergingManager
        self.adding_algorithm: Adding_algorithms

    def start(self):
        """
        Prepare for tree initialization. Starts the following agents:
            1. Reader -> Get contextual information about the competition
            2. Validator -> Divide the training sample into training and validation
            3. Scorer -> Create a function to evaluate the pipeline
            4. Baseliner -> Create a baseline
        If at least one agent fails to complete the task, the system terminates with an error
        :return: None
        """

        # initialize retrieve model
        retrieve_model = SentenceTransformer('intfloat/multilingual-e5-large')
        self.sub_logger.info(f"✅ Retrieve model initialized")

        # --------- Reader  ---------
        self.main_logger.info("Start reading")
        error, description_file_path = self.reader.get_dataset_description()
        if error:
            self.sub_logger.error(f"❌ Reader fail")
            self.state = 'error'
            return
        self.config['background_data_path'] = description_file_path
        with open(description_file_path, 'r') as f:
            self.background_data = '\n'.join(f.readlines())

        self.sub_logger.info(f"✅ Reading complete. Save file in {description_file_path}")

        # ------- Validator  --------
        self.main_logger.info("Validator start")
        error, validator_filepath = self.validator.test_train_split()
        self.sub_logger.info(f"The code from the Validator save in {validator_filepath}")
        if error is not None:
            self.sub_logger.error(f"❌ Validator fail. Error: {error}")
            self.state = 'error'
            return
        self.sub_logger.info("✅ The Validator has worked successfully!")

        # --------- Scorer  ---------
        self.main_logger.info("Scorer start")
        error, scorer_filepath, self.is_higher_better = self.scorer.get_evaluation_code()
        if error:
            self.sub_logger.error(f"❌ Scorer fail")
            self.state = 'error'
            return
        self.sub_logger.info(
            f"The code from the Scorer save in {scorer_filepath}.\nIs higher better: {self.is_higher_better}")
        self.sub_logger.info("✅ The Scorer has worked successfully!")

        # ------- Rag Agent ------
        if self.rag_agent:
            self.main_logger.info("RagAgent start")
            arxiv_texts = parse_arxiv(self.rag_agent, n=self.config['retrieve_n_papers'])
            kaggle_texts = parse_kaggle(self.config['background_data_path'],
                                        self.config['competitions_path'],
                                        self.config['vector_index_path'],
                                        self.config['metadata_path'],
                                        retrieve_model,
                                        top_n_competitions=self.config['retrieve_n_competitions'],
                                        threshold=0)
            self.rag_agent.pool_ideas = self.rag_agent.generate_pool_ideas(arxiv_texts + kaggle_texts)
            self.sub_logger.info("✅ The RagAgent has worked successfully!")

        self.coder = CodeAgentAPI(
            config=self.config, agent_name='coder',
            main_logger=self.main_logger, sub_logger=self.sub_logger, debug_logger=self.debug_logger,
            checker=self.checker, is_higher_better=self.is_higher_better
        )

        self.debugger.set_coder(self.coder)

        # -------- Baseliner  -------
        self.main_logger.info("Baseliner start")
        path, error, self.baseline_score = self.baseliner.get_baseline(
            debug_agent=self.debugger
        )
        if error is not None:
            self.state = 'error'
            return

        self.sub_logger.info("✅ The Baseliner has worked successfully!")

        # --------  Define remaining agents and algorithms --------
        self.insighter = InsightAgentAPI(
            config=self.config, agent_name='insighter',
            main_logger=self.main_logger, sub_logger=self.sub_logger, debug_logger=self.debug_logger,
            coder=self.coder, checker=self.checker,
            rag_agent=self.rag_agent, retrieve_model=retrieve_model
        )
        retrieve_model.to("cpu")
        del retrieve_model
        gc.collect()
        torch.cuda.empty_cache()

        self.estimator = EstimateAgent(
            config=self.config, agent_name='estimator',
            main_logger=self.main_logger, sub_logger=self.sub_logger, debug_logger=self.debug_logger,
            debugger=self.debugger, coder=self.coder, background_data=self.background_data
        )

        self.merging_algorithm = MergingManager(
            config=self.config,
            is_higher_better=self.is_higher_better,
            debugger=self.debugger, coder=self.coder, insighter=self.insighter,
            sub_logger=self.sub_logger, debug_logger=self.debug_logger
        )
        self.adding_algorithm = Adding_algorithms(
            config=self.config, is_higher_better=self.is_higher_better, insighter=self.insighter,
            sub_logger=self.sub_logger
        )
        self.state = 'InitialState_EDA'

    def forward(self, passage_number: int):
        """
        Execute one step of the pipeline at one of the following stages:
            1. EDA
            2. Data preparation
            3. Modeling
            4. Merging
            5. Adding
            6. Back propagation
        :param passage_number: int - tree passage number
        :return: None
        """
        pre_path_to_save_passage = os.path.join('code', f'passage_number_{passage_number}')
        os.makedirs(os.path.join(self.config['path_log'], pre_path_to_save_passage), exist_ok=True)

        # Phase has the format "InitialState_Stage" or just "Stage"
        phase = self.state.split("_")
        current_state = self.state
        self.main_logger.info(f"Phase: {self.state}")

        self.insighter.clear_context()

        previous_ideas = []
        start_work = time.time()
        if phase[0] == "InitialState":
            if self.config['dynamic_model']:
                self.config['model_name'] = 'gemini-2.0-flash'
            # Phase existence check
            for phase_data in self.phases:
                if phase[1] == phase_data[2]:
                    task_name, filename = phase_data[0], phase_data[1]
                    break
            else:
                phase_data_name = [phase_data[2] for phase_data in self.phases]
                raise ValueError(f"{phase[1]} not in {phase_data_name}")

            # Processing for the first pass. Form the initial tree
            match phase[1]:
                case 'EDA':
                    self.insighter.clear_context()
                    if self.config['dynamic_model']:
                        self.config['model_name'] = 'gemini-2.5-flash'
                    # 1. Generating ideas
                    eda_ideas = self.insighter.generate_eda_ideas()
                    debug_code = None
                    code_output = ""

                    # 2. Debug code
                    if eda_ideas:
                        task_filepath, debug_code, code_output, score = self.debugger.generate_and_debug_code(
                            filename=filename,
                            pre_path=pre_path_to_save_passage,
                            submission_name="",
                            coder_implement_func=self.coder.implement_eda,
                            code_params=dict(
                                ideas=eda_ideas,
                                result_dir_path=self.config['path_log']
                            ),
                            agent_name="Coder (EDA)",
                            needs_invalid=False,
                            debug_speed_mode="standard"
                        )

                    if debug_code is None:
                        self.main_logger.info('Cannot generate EDA. Continue without EDA')
                        self.eda_output = ""
                        self.eda_images = None
                    else:
                        self.eda_images = None
                        eda_ideas_format = ""
                        for num, idea in enumerate(eda_ideas):
                            eda_ideas_format += f"{num + 1}. {idea}\n"
                        self.sub_logger.info("Start reasoner for analyze eda")
                        self.eda_output = self.reasoner.eda_analysis(ideas=eda_ideas_format, eda_output=code_output)

                    self.state = 'InitialState_FeatureEngineering'
                case 'FeatureEngineering':
                    # previous_ideas - The ideas of the previous stage.
                    # They are the parents of the nodes of the following
                    previous_ideas, _ = self.generate_nodes_at_the_stage(
                        filename=filename,
                        task_name=task_name,
                        pre_path=pre_path_to_save_passage,
                        eda_output=self.eda_output,
                        eda_images=self.eda_images
                    )
                    self.state = 'InitialState_Modeling'
                case 'Modeling':
                    if self.config['need_scoring_predict']:
                        # complex_ideas: [{'idea_description': idea description, 'score': idea score}, ...]

                        # ideas_with_score is an array of dictionaries describing ideas and their score.
                        # These ideas are launched to generate submissions and for get score
                        # The estimator will be based on them.

                        # cross_dataset_idea is one common idea of modeling that is taught with every idea of feature
                        # engineering. The result of the training will be submitted to the estimator.
                        if self.config['anchor_examples']:
                            self.sub_logger.info('-' * 20 + "Train complex ideas" + '-' * 20)
                            if self.config['dynamic_model']:
                                self.config['model_name'] = 'gemini-2.0-flash'
                            complex_ideas_with_score, cross_dataset_idea = self.generate_and_debug_complex_training(
                                pre_path=pre_path_to_save_passage,
                                eda_output=self.eda_output,
                                eda_images=self.eda_images,
                            )
                            self.cross_dataset_idea = cross_dataset_idea
                            self.complex_ideas_with_score = complex_ideas_with_score

                            self.sub_logger.info('-' * 20 + "Main MT nodes training" + '-' * 20)
                            if self.config['dynamic_model']:
                                self.config['model_name'] = 'gemini-2.5-flash'
                            indexes_modeling, scores = self.generate_nodes_at_the_stage(
                                filename=filename,
                                task_name=task_name,
                                pre_path=pre_path_to_save_passage,
                                eda_output=self.eda_output,
                                eda_images=None,
                                complex_ideas_with_score=self.complex_ideas_with_score,
                                cross_dataset_idea=self.cross_dataset_idea,
                                predict_score=True
                            )
                        else:
                            if self.config['dynamic_model']:
                                self.config['model_name'] = 'gemini-2.5-flash'
                            indexes_modeling, scores = self.generate_nodes_at_the_stage(
                                filename=filename,
                                task_name=task_name,
                                pre_path=pre_path_to_save_passage,
                                eda_output=self.eda_output,
                                eda_images=None,
                                predict_score=True
                            )
                    else:
                        if self.config['dynamic_model']:
                            self.config['model_name'] = 'gemini-2.5-flash'
                        indexes_modeling, scores = self.generate_nodes_at_the_stage(
                            filename=filename,
                            task_name=task_name,
                            pre_path=pre_path_to_save_passage,
                            eda_output=self.eda_output,
                            eda_images=None,
                            predict_score=False,
                            complex_ideas_with_score=None,
                            cross_dataset_idea=None
                        )

                    if indexes_modeling is not None:
                        # We keep the complete code of branches that worked correctly
                        final_codes = []
                        for idea_index, score in zip(indexes_modeling, scores):
                            code = self.insighter.insight_tree.get_all_code_in_branch(idea_index)
                            if self.config['need_format_pipeline']:
                                format_code = extract_python_code(self.coder.format_code(code))
                            else:
                                format_code = code

                            final_codes.append(format_code)
                            self.node_scores.append((idea_index, score))

                            baseline_diff = score - self.baseline_score
                            if baseline_diff > 0:
                                emoji = '📈'
                            else:
                                emoji = '📉'
                            self.sub_logger.info(
                                f"Idea index: {idea_index}\nScore: {score}\nDifference with baseline"
                                f" {round(baseline_diff, 4)} {emoji}"
                            )

                        for num_generation, final_code in enumerate(final_codes):
                            self.insighter.save_code_to_file(
                                final_code,
                                f'pipeline_code_generation_{num_generation}.py',
                                pre_path=pre_path_to_save_passage
                            )
                        previous_ideas = None
                        self.state = 'complete'

            self.previous_ideas = previous_ideas
            self.sub_logger.info(f"⚫\tFinish: {phase[1]}")
        else:
            # The logic of the remaining n passes, where n > 1
            match current_state:
                case 'AddingEDA':
                    self.adding_eda(passage_number)
                    self.state = 'Adding'
                case 'Adding':
                    self.adding(passage_number)
                    self.state = 'Merging'
                case 'Merging':
                    self.merging(passage_number)
                    self.state = 'CompletePassage'

            self.sub_logger.info(f"⚫\tFinish: {phase[0]}")
        write_running_time(start_work, self.config["path_debug_log"], f"{current_state}_{passage_number}")

    def generate_nodes_at_the_stage(
            self, filename: str, task_name: str, pre_path: str,
            complex_ideas_with_score: list | None = None,
            cross_dataset_idea: str | None = None,
            eda_output: str | None = None,
            eda_images: list | None = None,
            predict_score: bool = False
    ):
        """
        Depending on task_name, generate nodes at stages taking into account parent nodes

        :param filename: file name template in which the code will be saved
        :param task_name: stage name
        :param pre_path: prefix to the file storage path
        :param complex_ideas_with_score: [{'idea_description': idea description, 'score': idea score}, ...] or None
        :param cross_dataset_idea: one common idea of modeling that is taught with every idea of feature
        :param eda_output: text output from the EDA stage
        :param eda_images: images generated during the EDA phase
        :param predict_score: is it necessary to use the estimator (bool)
        :return: Tuple:
            - idea_indexes_add - nodes indexes that were generated for this stage
            - scores_add - the corresponding scores for these ideas
        """
        idea_indexes, scores = [], []
        if task_name == 'Model training':
            for parent_idea_number, parent_idea_index in enumerate(self.previous_ideas):
                self.sub_logger.info(f"⬛  Parent idea number: {parent_idea_number + 1}/{len(self.previous_ideas)}")
                idea_branch = self.insighter.insight_tree.get_branch(parent_idea_index)
                idea_indexes_add, scores_add = self.generate_and_debug_ideas(
                    filename=filename,
                    task_name=task_name,
                    pre_path=pre_path,
                    previous_ideas=idea_branch,
                    parent_idea_index=parent_idea_index,
                    eda_output=eda_output,
                    eda_images=None,
                    complex_ideas_with_score=complex_ideas_with_score,
                    cross_dataset_idea=cross_dataset_idea,
                    need_predict_score=predict_score,
                    is_it_complex_training=False
                )

                if len(self.insighter.insight_tree.nodes[parent_idea_index].children) == 0:
                    self.sub_logger.info(f"Remove {parent_idea_index} (not a single successful child)")
                    self.insighter.insight_tree.remove_node(parent_idea_index)
                idea_indexes.extend(idea_indexes_add)
                scores.extend(scores_add)

            return idea_indexes, scores
        elif task_name == 'Data preparation and feature engineering':
            idea_indexes_add, scores_add = self.generate_and_debug_ideas(
                filename=filename,
                task_name=task_name,
                pre_path=pre_path,
                previous_ideas=[],
                parent_idea_index=None,
                eda_output=eda_output,
                eda_images=eda_images,
                is_it_complex_training=False
            )
            return idea_indexes_add, scores_add

    def generate_and_debug_complex_training(self, pre_path: str,
                                            eda_output: str | None = None,
                                            eda_images: list | None = None, ):
        parent_idea_number = 0
        parent_idea_index = self.previous_ideas[parent_idea_number]
        idea_branch = self.insighter.insight_tree.get_branch(parent_idea_index)
        complex_ideas_with_score, cross_dataset_idea = self.generate_and_debug_ideas(
            filename='complex_training.py',
            task_name='Model training',
            pre_path=pre_path,
            previous_ideas=idea_branch,
            parent_idea_index=parent_idea_index,
            eda_output=eda_output,
            eda_images=eda_images,
            is_it_complex_training=True
        )
        return complex_ideas_with_score, cross_dataset_idea

    def generate_and_debug_ideas(
            self, filename: str, task_name: str, pre_path: str, previous_ideas: list,
            parent_idea_index: int | None = None,
            eda_output: str | None = None,
            eda_images: list | None = None,
            complex_ideas_with_score: list | None = None,
            cross_dataset_idea: str | None = None,
            need_predict_score: bool = False, is_it_complex_training: bool = False
    ):
        """
        Generate, implement and debug ideas at the stage or complex ideas

        if 'is_it_complex_training=True', then 'complex_ideas_with_score' and 'this_dataset_idea' must be None

        :param filename: file name template in which the code will be saved
        :param task_name: stage name
        :param pre_path: prefix to the file storage path
        :param previous_ideas: Previous ideas for this branch
        :param parent_idea_index: parent node index
        :param eda_output: text output from the EDA stage
        :param eda_images: images generated during the EDA phase
        :param complex_ideas_with_score: [{'idea_description': idea description, 'score': idea score}, ...] or None
        :param cross_dataset_idea: one common idea of modeling that is taught with every idea of feature
        :param need_predict_score: is it necessary to use the estimator (bool)
        :param is_it_complex_training: is this the stage of obtaining a score for complex_ideas (bool)
        :return: Depending on is_it_complex_training.
            - If is_it_complex_training=False,
            then idea_indexes and scores are returned—arrays of idea indexes and their corresponding scores.
            - If is_it_complex_training=True,
            then new_complex_ideas_with_score - generated format array complex_ideas_with_score and cross_dataset_insight
        """

        idea_indexes = []
        scores = []

        # if is_it_complex_training=True we form 'complex_ideas_with_score' and 'score_this_dataset'
        new_complex_ideas_with_score = []
        success_complex_ideas = []
        score_this_dataset = None

        # 1. Generating ideas:
        if is_it_complex_training:
            # Complex ideas
            need_predict_score = False
            ideas, number_of_ideas, cross_dataset_idea = self.insighter.generate_competitive_insights(
                eda_output=eda_output,
                eda_images=eda_images
            )
            timeout = self.config['max_minutes_to_run_for_complex_training']
        else:
            # Ideas at the stage
            timeout = self.config['runtime_error_time']
            ideas, number_of_ideas = self.insighter.generate_phase_ideas(
                task_name=task_name,
                previous_ideas=previous_ideas,
                eda_output=eda_output,
                eda_images=eda_images
            )
            if ideas is None:
                return [], []

        # 2. Form filename ans define prev_code
        filename = filename.strip(".py")
        current_index = self.insighter.insight_tree.current_index
        if parent_idea_index is not None:
            prev_code = self.insighter.insight_tree.get_all_code_in_branch(parent_idea_index)
            filename += f'_parent_{parent_idea_index}'
        else:
            prev_code = "No. You're in stage one"

        # 3. Train cross_dataset_idea on this instance of the dataset
        if need_predict_score and cross_dataset_idea:
            curr_model_name = self.config['model_name']
            try:
                # Implementing idea
                self.sub_logger.info("-" * 10 + f" Idea for score prediction " + "-" * 10)
                if self.config['dynamic_model']:
                    self.config['model_name'] = 'gemini-2.0-flash'
                task_filepath, code_for_score, _, score_this_dataset = self.debugger.generate_and_debug_code(
                    filename=f'{filename}_idea_for_score_prediction.py',
                    pre_path=pre_path,
                    submission_name=f"my_submission_{current_index}.csv",
                    coder_implement_func=self.coder.implement_task,
                    code_params=dict(
                        idea=cross_dataset_idea,
                        previous_code=prev_code,
                        task_name=task_name,
                        eda_output=eda_output,
                        eda_images=eda_images,
                        node_index=current_index,
                        parent_index=parent_idea_index
                    ),
                    agent_name="Coder",
                    needs_invalid=True
                )
                if code_for_score:
                    # Bind cross_dataset_idea to the dataset (it will be used later at the adding and merging stage)
                    self.sub_logger.info(f"Score this dataset: {score_this_dataset}")
                    self.insighter.insight_tree.nodes[parent_idea_index].score_for_prediction = {
                        'idea': cross_dataset_idea,
                        'score': score_this_dataset
                    }
                else:
                    score_this_dataset = None
            # If we can't debug cross_dataset_idea, skip it
            except Exception as err:
                self.sub_logger.info(f"An error occurred while predicting the score: {err}")
                score_this_dataset = None
            finally:
                self.config['model_name'] = curr_model_name

        # 4. Loop through all generated ideas
        for idea_number, idea in enumerate(ideas):
            self.sub_logger.info(f"⬛\tIdea number: {idea_number + 1}/{number_of_ideas}\t{idea}")
            node_index = self.insighter.insight_tree.current_index
            new_filename = f'{filename}_node_{node_index}.py'

            predicted_score = None
            score = None
            if need_predict_score:
                # Generate code for get predict from scoring model
                task_new_code = self.coder.implement_task(
                    idea=idea,
                    previous_code=prev_code,
                    task_name=task_name,
                    eda_output=eda_output,
                    eda_images=eda_images,
                    node_index=node_index,
                    parent_index=parent_idea_index
                )

                if task_new_code is None:
                    # If no code could be generated for a given idea, skip it
                    self.sub_logger.info("Skip the idea")
                    continue

                task_filepath = self.coder.save_code_to_file(task_new_code, new_filename, pre_path)
                # Generate a description for the code (necessary for more accurate work of estimate_agent)
                description = self.estimator.generate_description(task_new_code)

                # Score prediction and debug on accelerated version of the code (1 epochs/iteration/etc. for training)
                debug_code, predicted_score = self.estimator.predict_score_and_debug(
                    examples_other=complex_ideas_with_score,
                    example_this={'description': cross_dataset_idea, 'score': score_this_dataset},
                    description=description,
                    code=task_new_code,
                    node_index=node_index,
                    new_filename=new_filename,
                    pre_path=pre_path,
                )
                if debug_code is not None:
                    task_filepath = self.coder.save_code_to_file(debug_code, new_filename, pre_path)

                self.sub_logger.info(f'Predicted score: {predicted_score}')
                if predicted_score is not None and self.config['is_scoring_model_test'] and bool(task_name == "Model training"):
                    self.sub_logger.info("Training to test the correctness of the scoring model")
                    submission_name = f"my_submission_{node_index}.csv"
                    debug_code_real, code_output_real, score = self.debugger.run_code(
                        task_filepath,
                        submission_path=os.path.join(self.config['path_log'], "submissions", submission_name),
                        needs_invalid=True
                    )
                    self.sub_logger.info(f'Real score: {score}')
            else:
                # If we do not predict score just debug branch
                task_filepath, debug_code, code_output, score = self.debugger.generate_and_debug_code(
                    filename=new_filename,
                    pre_path=pre_path,
                    submission_name=f"my_submission_{node_index}.csv",
                    coder_implement_func=self.coder.implement_task,
                    code_params=dict(
                        idea=idea,
                        previous_code=prev_code,
                        task_name=task_name,
                        eda_output=eda_output,
                        eda_images=eda_images,
                        node_index=node_index,
                        parent_index=parent_idea_index
                    ),
                    agent_name="Coder",
                    needs_invalid=bool(task_name == "Model training"),
                    timeout=timeout
                )

            # If we cannot debug code or predict score just skip idea
            if debug_code is not None and (score is not None or bool(task_name != "Model training") or predicted_score is not None):
                if not is_it_complex_training:
                    index = self.insighter.insight_tree.add_idea(idea, debug_code, parent_idea_index)
                    if self.config['is_scoring_model_test'] and bool(
                            task_name == "Model training") and need_predict_score:
                        self.insighter.insight_tree.nodes[index].predicted_score = predicted_score
                        self.insighter.insight_tree.nodes[index].description = description
                    idea_indexes.append(index)
                    if predicted_score is not None:
                        scores.append(predicted_score)
                    else:
                        scores.append(score)
                else:
                    success_complex_ideas.append(idea)
                    new_complex_ideas_with_score.append({
                        'idea_description': self.estimator.generate_description(debug_code), 'score': score,
                        'code_output': code_output
                    })
            else:
                if task_filepath is not None:
                    os.remove(task_filepath)
                self.sub_logger.info("Skip the idea")
            time.sleep(self.config['insight_delay'])

        if is_it_complex_training:
            if cross_dataset_idea not in success_complex_ideas and success_complex_ideas:
                cross_dataset_idea = success_complex_ideas[0]
            return new_complex_ideas_with_score, cross_dataset_idea
        else:
            return idea_indexes, scores

    def adding_eda(self, passage_number: int):
        self.main_logger.info("Adding EDA")
        pre_path = os.path.join(self.config['path_log'], 'code', f'passage_number_{passage_number}')
        path_tree_info = os.path.join(pre_path, 'tree_info.json')
        tree = self.insighter.insight_tree

        modeling_nodes = [
            node_index for node_index in tree.nodes
            if tree.nodes[node_index] and tree.nodes[node_index].depth == 2 \
               and tree.nodes[node_index].mean_score is not None
        ]
        if self.is_higher_better:
            modeling_nodes.sort(key=lambda node_index: -tree.nodes[node_index].mean_score)
        else:
            modeling_nodes.sort(key=lambda node_index: tree.nodes[node_index].mean_score)

        if len(modeling_nodes) > 2 * self.config["top_n_for_eda"]:
            modeling_nodes = modeling_nodes[:self.config["top_n_for_eda"]] + modeling_nodes[
                                                                             -self.config["top_n_for_eda"]:]

        parents_node = defaultdict(list)
        for node in modeling_nodes:
            parents_node[tree.nodes[node].parent].append(node)
        parents_node = dict(parents_node)

        introduce_tree = {}
        for parent_node in parents_node:
            children_info = []
            for children_index in parents_node[parent_node]:
                children_info.append({
                    children_index: {
                        "Score": tree.nodes[children_index].mean_score,
                        "Idea": tree.nodes[children_index].idea,
                    }
                })
            introduce_tree[parent_node.index] = {
                "Parent idea": parent_node.idea,
                "Parent score": parent_node.mean_score,
                "Children info": children_info
            }

        with open(path_tree_info, 'w', encoding='utf-8') as f:
            json.dump(introduce_tree, f, indent=4, ensure_ascii=False)

        self.sub_logger.info("Do we need to add EDA...?")
        need_eda, new_eda_idea = self.reasoner.do_need_to_add_eda(
            tree_info_path=path_tree_info, is_higher_better=self.is_higher_better
        )
        if need_eda:
            task_filepath, debug_code, code_output, score = self.debugger.generate_and_debug_code(
                filename=f"eda_{passage_number}.py",
                pre_path=os.path.join('code', f'passage_number_{passage_number}'),
                submission_name="",
                coder_implement_func=self.coder.implement_eda,
                code_params=dict(
                    ideas=new_eda_idea,
                    result_dir_path=self.config['path_log']
                ),
                agent_name="Coder (EDA)",
                needs_invalid=False,
                debug_speed_mode="standard"
            )
            if debug_code is None:
                self.sub_logger.info('Cannot generate new EDA')
            else:
                self.sub_logger.info("✅ Updating EDA")
                self.eda_output = self.reasoner.merge_eda(
                    eda_output=code_output, idea=new_eda_idea, merge_number=passage_number
                )
        else:
            self.sub_logger.info("❌ The agent decided not to add EDA")

    def adding(self, passage_number: int):
        """
        Perform the adding stage

        :param passage_number: int - tree passage number
        :return: None
        """
        pre_path_adding = os.path.join(
            'code', f'passage_number_{passage_number}', f'adding_passage_{passage_number}'
        )
        self.main_logger.info("Adding")

        tree = self.insighter.insight_tree
        last_indexes = [
            node_index for node_index in tree.nodes
            if tree.nodes[node_index] and tree.nodes[node_index].depth == 2
        ]
        added_indexes = []
        scores = []

        # We go through the phases from the highest level (Data preparation and feature engineering) downwards:
        # 1. Data preparation and feature engineering
        # 2. Modeling
        for phase_idea_index in range(len(self.config['phases'][:-1]) - 1, -1, -1):
            task_name, filename, _ = self.config['phases'][phase_idea_index]
            ideas_with_previous_code = self.adding_algorithm.add_new_ideas(
                task_name=task_name,
                node_indexes_on_the_phase=last_indexes,
                eda_images=self.eda_images,
                eda_output=self.eda_output
            )
            new_added_indexes, new_scores = self.implement_and_debug_adding_idea(
                task_name=task_name, filename=filename, phase_index=phase_idea_index,
                ideas_with_previous_code=ideas_with_previous_code, pre_path_adding=pre_path_adding
            )

            added_indexes += new_added_indexes
            scores += new_scores

        # Back propagation for new ideas
        for i in range(len(added_indexes)):
            self.insighter.insight_tree.backprop(added_indexes[i], scores[i], self.debug_logger)

    def implement_and_debug_adding_idea(
            self, task_name: str, filename: str, phase_index: int,
            ideas_with_previous_code: dict, pre_path_adding: str
    ):
        """
        Implements ideas generated during the adding stage:
            1. For Data preparation and feature engineering, generates children of the Modeling stage
            2. For Modeling, implements, debug, and obtains score

        :param task_name: stage name
        :param filename: file name template in which the code will be saved
        :param phase_index: index of the phase under consideration
        :param ideas_with_previous_code: a dictionary where the keys are parent indexes
                                         and the values are dictionaries of ideas with code
        :param pre_path_adding: prefix to the file storage path
        :return: indexes of new ideas and their score
        """
        new_added_indexes = []
        new_scores = []
        filename = filename.strip(".py")
        for parent_index in ideas_with_previous_code:
            # for Data preparation and feature engineering parent_index = -1
            # and is not taken into account in the rest of the code
            if parent_index != -1:
                parent_filename = f"{filename}_paranet_{parent_index}"
            else:
                parent_filename = filename

            ideas = ideas_with_previous_code[parent_index]["idea"]
            previous_code = ideas_with_previous_code[parent_index]["previous_code"]
            group = ideas_with_previous_code[parent_index]["group"]
            for idea_nummer, idea in enumerate(ideas[:self.config['max_add_idea']]):
                current_index = self.insighter.insight_tree.current_index
                node_filename = f"{parent_filename}_node_{current_index}.py"
                self.sub_logger.info(f"{idea_nummer + 1}. {idea}")
                if parent_index == -1:
                    parent_index_set = None
                else:
                    parent_index_set = parent_index

                task_filepath, debug_code, _, score = self.debugger.generate_and_debug_code(
                    filename=node_filename,
                    pre_path=pre_path_adding,
                    submission_name=f"my_submission_{current_index}.csv",
                    coder_implement_func=self.coder.implement_task,
                    code_params=dict(
                        idea=idea,
                        previous_code=previous_code,
                        task_name=task_name,
                        eda_output=self.eda_output,
                        eda_images=self.eda_images,
                        node_index=current_index,
                        parent_index=parent_index
                    ),
                    agent_name="Coder",
                    needs_invalid=bool(task_name == "Model training")
                )

                if debug_code is not None:
                    index_add_idea = self.insighter.insight_tree.add_idea(
                        idea, debug_code, parent_index=parent_index_set
                    )
                    self.insighter.insight_tree.set_group_for_node(group, index_add_idea)
                    indexes_new = [index_add_idea]
                    scores_new = [score]
                    task_index_new = phase_index

                    # 4. Generates the rest of the tree for non-final vertices
                    while task_index_new != 0:
                        task_index_new -= 1  # We descend to the level below
                        task_name_new, filename_new, _ = self.config['phases'][task_index_new]
                        self.previous_ideas = indexes_new
                        indexes_new, scores_new = self.generate_nodes_at_the_stage(
                            filename=filename_new,
                            task_name=task_name_new,
                            pre_path=pre_path_adding,
                            eda_output=self.eda_output,
                            eda_images=self.eda_images,
                            complex_ideas_with_score=self.complex_ideas_with_score,
                            cross_dataset_idea=self.cross_dataset_idea,
                            predict_score=self.config['need_scoring_predict']
                        )

                    new_added_indexes += indexes_new
                    new_scores += scores_new
                else:
                    if task_filepath is not None:
                        os.remove(task_filepath)
        return new_added_indexes, new_scores

    def merging(self, passage_number: int):
        """
        Perform the merging stage

        :param passage_number: int - tree passage number
        :return: None
        """
        pre_path_merging = os.path.join(
            'code', f'passage_number_{passage_number}', f'merge_passage_{passage_number}'
        )
        self.main_logger.info("Merging")

        tree = self.insighter.insight_tree
        last_indexes = [
            node_index for node_index in tree.nodes
            if tree.nodes[node_index] and tree.nodes[node_index].depth == 2
        ]

        merge_indexes = self.merging_algorithm.merge_ideas(
            pre_path_merging,
            last_indexes,
            baseline_score=self.baseline_score
        )

        # Backprop 1
        for merge_index in merge_indexes[0]:
            self.insighter.insight_tree.backprop(
                merge_index,
                self.insighter.insight_tree.nodes[merge_index].mean_score,
                self.debug_logger,
                need_update_score_for_this_node=False
            )
        self.previous_ideas = merge_indexes[1]

        task_name, filename, _ = self.config['phases'][0]
        self.sub_logger.info(f"\t 🔷 Add new node")
        merge_indexes_new, scores = self.generate_nodes_at_the_stage(
            filename=filename,
            task_name=task_name,
            pre_path=pre_path_merging,
            eda_output=self.eda_output,
            eda_images=self.eda_images,
            complex_ideas_with_score=self.complex_ideas_with_score,
            cross_dataset_idea=self.cross_dataset_idea,
            predict_score=self.config['need_scoring_predict']
        )
        # Backprop 2
        for i in range(len(merge_indexes_new)):
            self.insighter.insight_tree.backprop(merge_indexes_new[i], scores[i], self.debug_logger)

    def backprop(self):
        """
        Updates the average speed of vertices in the branch
        :return: None
        """
        if not self.node_scores:
            self.main_logger.info("node_scores is empty")
            self.state = "error"
            return

        for node_ind, score in self.node_scores:
            self.insighter.insight_tree.backprop(node_ind, score, self.debug_logger)

    def reflect(self, passage_number: int):
        """
        Collect all vertices at the final stage, take the top N by score,
        and run them on a test sample

        :param passage_number: int - tree passage number
        :return:
        """
        start_work = time.time()
        tree = self.insighter.insight_tree
        pre_path_to_save_results_of_passage = os.path.join('results', f'passage_number_{passage_number}')

        modeling_nodes = [
            node_index for node_index in tree.nodes
            if tree.nodes[node_index] and tree.nodes[node_index].depth == 2 \
               and tree.nodes[node_index].mean_score is not None
        ]
        if self.is_higher_better:
            modeling_nodes.sort(key=lambda x: -tree.nodes[x].mean_score)
        else:
            modeling_nodes.sort(key=lambda x: tree.nodes[x].mean_score)

        self.main_logger.info("Reflection began")
        selected_node_indexes = modeling_nodes[:self.config['top_N_for_running_on_test']]
        node_indexes_on_test = {}
        for ind, select_node_index in enumerate(selected_node_indexes):
            self.sub_logger.info(f"Node {ind + 1}/{len(selected_node_indexes)}")
            code = self.coder.format_code(
                self.insighter.insight_tree.get_all_code_in_branch(select_node_index)
            )
            submission_name = f"test_submission_{select_node_index}.csv"
            submission_file_path = os.path.join(self.config['path_log'], pre_path_to_save_results_of_passage,
                                                submission_name)

            code_with_test_data = replace_dirs(
                code,
                data_dir=self.config['data_dir_path'],
                result_dir=pre_path_to_save_results_of_passage,
                submission_subdir=submission_name
            )

            code_with_test_data = extract_python_code(self.coder.replace_paths(
                code=code_with_test_data,
                train_csv_path=os.path.join(self.config['data_dir_path'], 'train.csv'),
                test_csv_path=os.path.join(self.config['data_dir_path'], 'test.csv'),
                output_dir=os.path.join(self.config["path_log"], pre_path_to_save_results_of_passage),
                submission_filename=submission_name,
                base_dir=self.config['data_dir_path']
            ))
            filepath_save = self.coder.save_code_to_file(
                code_with_test_data, f"node_{select_node_index}_in_test_data.py",
                pre_path=pre_path_to_save_results_of_passage
            )
            code, _, score = self.debugger.run_code(
                filepath_save,
                submission_file_path,
                needs_invalid=True,
                test_submit_file_path=os.path.join(self.config['data_dir_path'], "sample_submission.csv"),
                timeout=60
            )

            if not self.config['need_test_score']:
                continue
            if code is not None:
                test_submission_file_path = os.path.join(self.config['data_dir_path'], "test_labeled.csv")
                code_output, error = execute_code(
                    os.path.join(self.config['data_dir_path'], "count_metric.py"),
                    args=["--test_path", test_submission_file_path, "--predict_path", submission_file_path],
                    log_file=self.config["path_debug_log"], agent_name="reflect", timeout=60
                )
                if error is None:
                    node_indexes_on_test[select_node_index] = {
                        "test_score": code_output,
                        "file_with_code": filepath_save
                    }
                    self.sub_logger.info(f"Test score: {code_output}")
                else:
                    self.sub_logger.info(f"Error: {error}")
            else:
                self.sub_logger.info(f"I couldn't debug the code.")

        write_running_time(start_work, self.config["path_debug_log"], f"reflect_{passage_number}")
        return node_indexes_on_test, os.path.join(self.config["path_log"], pre_path_to_save_results_of_passage)

    def generate_report(self, passage_number: int | str):
        # 1. Output the tree
        results_path_tree = os.path.join(self.config['path_log'], "results", f"insights_tree_json")
        os.makedirs(results_path_tree, exist_ok=True)
        tree_path = os.path.join(results_path_tree, f"insights_tree_{passage_number}.json")
        self.insighter.insight_tree.to_json(file_path=tree_path)

        # 2. Generate graphs
        results_path = os.path.join(self.config['path_log'], "results", f"passage_number_{passage_number}")
        os.makedirs(results_path, exist_ok=True)
        generate_all_plots(
            llm_tokens_file=os.path.join(self.config['path_debug_log'], "tokens.csv"),
            agent_time_file=os.path.join(self.config['path_debug_log'], "times.csv"),
            debug_logs_file=os.path.join(self.config['path_debug_log'], "debug_metrics.csv"),
            checker_agent_file=os.path.join(self.config['path_debug_log'], "checker_metrics.csv"),
            path_to_save=results_path
        )

        if passage_number == "final":
            self.reasoner.final_analysis(tree_path=tree_path)
        self.sub_logger.info("✅ Reports successfully generated!")

    def finish(self):
        """
        Generate a report on the pipeline

        :return:
        """
        # 1. Generate reports
        self.insighter.insight_tree.parse_final_nodes_to_json(path=self.config["path_log"])
        self.generate_report("final")

        # 2. Run final solution
        tree = self.insighter.insight_tree

        modeling_nodes = [
            node_index for node_index in tree.nodes
            if tree.nodes[node_index] and tree.nodes[node_index].depth == 2 \
               and tree.nodes[node_index].mean_score is not None
        ]
        if not modeling_nodes:
            best_node = "baseline"
            with open(os.path.join(self.config['path_log'], "code", "baseline.py"), "r") as f:
                code = f.read()
            idea = "Create baseline solutions"
            self.main_logger.info(f"Select baseline (score = {self.baseline_score})")
        else:
            if self.is_higher_better:
                best_node = sorted(
                    modeling_nodes, key=lambda x: -tree.nodes[x].mean_score
                )[0]
            else:
                best_node = sorted(
                    modeling_nodes, key=lambda x: tree.nodes[x].mean_score
                )[0]
            code = self.coder.format_code(
                self.insighter.insight_tree.get_all_code_in_branch(best_node)
            )
            idea = tree.nodes[best_node].idea
            self.main_logger.info(f"Select node {best_node} (score = {tree.nodes[best_node].mean_score})")

        submission_name = f"FINAL_SUBMIT_{best_node}.csv"
        submission_file_path = os.path.join(
            self.config['path_log'], "submissions", submission_name
        )

        code_with_test_data = replace_dirs(
            code,
            data_dir=self.config['data_dir_path'],
            result_dir=self.config['path_log'],
            submission_subdir=submission_name
        )

        code_with_test_data = extract_python_code(self.coder.final_processing(
            code=code_with_test_data,
            train_csv_path=os.path.join(self.config['data_dir_path'], 'train.csv'),
            test_csv_path=os.path.join(self.config['data_dir_path'], 'test.csv'),
            output_dir=self.config["path_log"],
            submission_filename=submission_name,
            base_dir=self.config['data_dir_path'],
            idea=idea
        ))
        filepath_save = self.coder.save_code_to_file(
            code_with_test_data, f"FINAL_CODE_{best_node}.py",
            pre_path=''
        )
        code, _, score = self.debugger.run_code(
            filepath_save,
            submission_file_path,
            needs_invalid=True,
            test_submit_file_path=os.path.join(self.config['data_dir_path'], "sample_submission.csv"),
            timeout=120
        )
