import json
import os
from copy import deepcopy

import gymnasium as gym
import numpy as np
from minigrid.utils.baby_ai_bot import BabyAIBot

# from babyai.levels.verifier import PickupInstr, ObjDesc
from babyai_utils import LanguageObsWrapper
from eval import Evaluator
from graph_creator2 import GraphCreator
# from subgoal_graph import build_tree_with_treelib, postorder_traversal, reverse_order_of_children, preorder_traversal

import random

from mistake_handling_bot import ErikBot


# Create the environment


def get_valid_env(env):
    valid = False
    state = None
    while not valid:
        np.random.seed = 1
        # env = gym.make(f'BabyAI-{env_name}', render_mode='human')
        state, info = env.reset()
        mission = state["mission"]

        if 'front' in mission or 'behind' in mission or 'right' in mission or 'left' in mission:
            valid = False
        else:
            valid = True

        if env.is_object_next_to_door():
            valid = False

        if env.same_objects():
            valid = False

    backup_env = deepcopy(env)
    backup_state = deepcopy(state)
    return state, backup_env, backup_state

def falsify_plan(plan, obj):
    falsified_plan = deepcopy(plan)

    actions = ["Open", "Pickup", "Drop", "Go next to", "Close"]
    if random.random() < 1:
        # 50% chance to add or remove an action
        if random.random() < 0.5:
            # Add a random action
            action = random.choice(actions)
            new_action = f"{action} {obj[0]} {obj[1]}"
            insert_position = random.randint(0, len(falsified_plan)-1)
            falsified_plan.insert(insert_position, new_action)
        else:
            # Remove a random action
            if falsified_plan:
                remove_position = random.randint(0, len(falsified_plan) - 2)
                falsified_plan.pop(remove_position)

    return falsified_plan


def create_data(env_name, num_samples=1, save=True):
    seed = int(random.random() * 100000)
    # env = gym.make(f'BabyAI-{env_name}', render_mode='human')
    env = gym.make(f'BabyAI-{env_name}')
    env = LanguageObsWrapper(env)

    data_entries = []

    # Run the loop for steps#
    evaluator = Evaluator()
    for episode in range(num_samples):
        # try:
            observation, new_env, new_state = get_valid_env(env)
            evaluator.set_env(env)
            evaluator.state = observation
            # env.env.env.env.env.instrs = PickupInstr(ObjDesc('key', 'blue'))
            a=5
            agent=ErikBot(env)
            # exit()
            graph = GraphCreator()
            mission = observation["mission"]
            level = observation["language"]
            print("Mission:", observation["mission"])
            print("Observation: ", observation["language"])
            done = False
            total_reward = 0
            action = None

            while not done:
                action = agent.replan(action_taken=action)
                # print(action)
                # print("Action: ", action)
                observation, reward, terminated, truncated, info = env.step(action)
                graph.add_stack(agent.stack)
                # print(agent.stack)
                done = terminated or truncated
                total_reward += reward
                env.render()

            tree, plan, poss_act = graph.print()

            new_evaluator = Evaluator()
            new_evaluator.set_env(new_env)
            print("Mission:", new_state["mission"])
            print("Level:", new_state["language"])
            falsified_plan = falsify_plan(plan, agent.get_random_obj())
            print("_____")
            print("Falsified plan")
            for i in falsified_plan:
                print(i)

            print("_____")
            print("Test Plan")
            plan = new_evaluator.check_plan_for_mistake(falsified_plan)
            for i in plan:
                print(i)

            print("_____")

            # plan to recover

            new_agent = BabyAIBot(new_env)
            print(new_agent.stack)
            done = False
            total_reward = 0
            action = None
            new_graph = GraphCreator()
            while not done:
                poss_act = agent.get_possible_actions()
                action = new_agent.replan(action_taken=action)
                # print(action)
                # print("Action: ", action)
                observation, reward, terminated, truncated, info = new_env.step(action)
                new_graph.add_stack(agent.stack, poss_act)
                # print(agent.stack)
                done = terminated or truncated
                total_reward += reward
                env.render()

            tree, plan = new_graph.print()

            data_entry = {
                "mission": mission,
                "level": level,
                "plan": plan,
                "tree": tree,
            }
            data_entries.append(data_entry)
            # if not os.path.exists(f"data/{env_name}"):
            #     os.makedirs(f"data/{env_name}")
            # create jsonl
            env.close()
            if save:
                with open(f"data/{env_name}.jsonl", "w") as f:
                    for data_entry in data_entries:
                        f.write(json.dumps(data_entry, ensure_ascii=False))
                        f.write("\n")
            else:
                return data_entries
        # except Exception as e:
        #     print(e)
        #     pass

if __name__ == "__main__":
    create_data("MiniBossLevel", 20000)

