from agents.base_agent import BaseAgent_openai
from prompts.reader_agent_prompts import READ_INSTRUCTION
import pandas as pd
import os
from utils.extractors import extract_markdown


class ReaderAgentAPI(BaseAgent_openai):
    def read_data(self):
        """
        Read and return the first lines of the source files in the dataset

        :return: text from "overview.txt", train_file.head(), train_file.describe(), sample_submission_file.head()
        """
        path_to_desc_file = os.path.join(self.config['data_dir_path'], "overview.txt")

        train_file = pd.read_csv(os.path.join(self.config['data_dir_path'], "train.csv"))
        sample_submission_file = pd.read_csv(os.path.join(self.config['data_dir_path'], "sample_submission.csv"))
        with open(path_to_desc_file, 'r') as f:
            return '\n'.join(f.readlines()), train_file.head(), train_file.describe(), sample_submission_file.head()

    def get_dataset_description(self):
        """
        Create a file with contextual information about the dataset

        :return: An error occurred (bool), description file path
        """
        self.clear_context()
        self.agent_name = 'reader'

        dir_path = self.config['data_dir_path']
        description, train_head, train_describe, sample_submission_file = self.read_data()

        self.instructions = READ_INSTRUCTION.format(
            description=description, train_head=train_head,
            sample_submission_file=sample_submission_file,
            train_description=train_describe, dataset_path=dir_path
        )

        result = self.code_generation_from_several_attempts(self.config['number_of_attempts_reader'])
        if result is None:
            return True, None

        description_file_path = self.save_code_to_file(extract_markdown(result), 'description.md', pre_path='')
        return False, description_file_path
