from abc import abstractmethod

import gymnasium as gym

from config import *
from tqdm import tqdm
from together import Together
from Testers.Test import LMFeedbackVerifier
from abc import ABC, abstractmethod
import json, requests
from hcraft.examples import MineHcraftEnv
from hcraft.examples.minecraft.items import DIAMOND
from hcraft.task import GetItemTask



from hcraft.transformation import InventoryOwner, InventoryOperation
def remove_underscore(str):
    return str.replace("_", " ")
def get_quantity_and_name(inventory_change):
    return str(inventory_change.quantity) + " " + remove_underscore(inventory_change.item.name)
def generate_craft_recipe(transformation, template="You can craft {item} with {requirements}."):
    item_str = [get_quantity_and_name(inventory_change) for inventory_change in transformation.inventory_changes[InventoryOwner("player")][InventoryOperation.ADD]]
    item_str = ", ".join(item_str)
    requirements_str = [get_quantity_and_name(inventory_change) for inventory_change in transformation.inventory_changes[InventoryOwner("player")][InventoryOperation.REMOVE]]
    requirements_str = ", ".join(requirements_str)
    return template.format(item=item_str, requirements=requirements_str)
smelt_tmplt = "You can get {item} after smelting with {requirements}."
craft_tmplt = "You can craft {item} with {requirements}."

def generate_move_to_str(transformation, template="You can move to {destination} from {place}."):
    # print(transformation)
    zone_str = transformation.zone.name
    destination_str = transformation.destination.name
    return template.format(place=zone_str, destination=destination_str)


def generate_search_recipe(transformation, template="You can collect {item} at {place}."):
    item_str = [get_quantity_and_name(inventory_change) for inventory_change in transformation.inventory_changes[InventoryOwner("player")][InventoryOperation.ADD]]
    item_str = ", ".join(item_str)
    try:
        remove_str = [get_quantity_and_name(inventory_change) for inventory_change in transformation.inventory_changes[InventoryOwner("player")][InventoryOperation.REMOVE]]
        remove_str = ", ".join(remove_str)
    except:
        remove_str = ""
    try:
        min_str = [get_quantity_and_name(inventory_change) for inventory_change in transformation.inventory_changes[InventoryOwner("player")][InventoryOperation.MIN]]
        min_str = ", ".join(min_str)
    except:
        min_str = ""
    zone_str = transformation.zone.name

    if min_str != "":
        final_str = "You need to have at least " + min_str + " to collect " + item_str + " at " + zone_str + "."
    else:
        final_str = template.format(item=item_str, place=zone_str)
    if remove_str != "":
        final_str += " " + remove_str + " will be consumed."
    return final_str

def hcraft_obs_extractor(data, condition_list):
    return data["state"]


def replace_symbols_from_str_to_space(input_str, removed_symbol=["-", "_"]):
    for symbol in removed_symbol:
        input_str = input_str.replace(symbol, " ")
    return input_str

def transformation_to_str(transformation):
    i = transformation
    if not "crafting" in i.name:
        if "smelt" in i.name:
            rule_str = generate_craft_recipe(i, template=smelt_tmplt) + "\n"
        if "craft" in i.name:
            rule_str = generate_craft_recipe(i, template=craft_tmplt) + "\n"
        if "search" in i.name:
            rule_str = generate_search_recipe(i) + "\n"
        if "move" in i.name and "with" not in i.name and "end" not in i.name and "stronghold" not in i.name and "nether" not in i.name:
            rule_str = generate_move_to_str(i) + "\n"
    return rule_str

def construct_legal_action_rules(env, legal_actions, exlucded_actions=[63,
 13,
 14,
 15,
 0,
 25,
 100,
 29,
 163,
 119,
 160,
 154,
 148,
 95,
 16,
 1,
 9,
 33,
 178,
 126]):
    """

    :param env:
    :param legal_actions:
    :param exlucded_actions: by default we exclude the actions in the expert path
    :return:
    """
    rules = ""
    for action in legal_actions:
        i = env.world.transformations[action]
        rule_str = ""
        if action not in exlucded_actions:
            if not "crafting" in i.name:
                if "smelt" in i.name:
                    rule_str = generate_craft_recipe(i, template=smelt_tmplt) + "\n"
                if "craft" in i.name:
                    rule_str = generate_craft_recipe(i, template=craft_tmplt) + "\n"
                if "search" in i.name:
                    rule_str = generate_search_recipe(i) + "\n"
                if "move" in i.name and "with" not in i.name and "end" not in i.name and "stronghold" not in i.name and "nether" not in i.name:
                    rule_str = generate_move_to_str(i) + "\n"
            rules += i.name + ": " + rule_str
    return rules






class HierachyCraftVerifier(LMFeedbackVerifier):
    def __init__(self, env, feedback_type, data_path, condition_list, **kargs):
        super().__init__(env, feedback_type, data_path, condition_list, **kargs)
        self.use_action_map_dict = True
        self.obs_representation_extractor = hcraft_obs_extractor
        self.goal = GetItemTask(DIAMOND)
        env = MineHcraftEnv(purpose=self.goal)
        env.reset()
        self.env_instance = env
        self.number_to_action_dict = {index: value for index, value in enumerate([replace_symbols_from_str_to_space(i.name) for i in env.state.world.transformations])}
        self.action_to_number_dict = {value.upper(): index for index, value in enumerate([replace_symbols_from_str_to_space(i.name) for i in env.state.world.transformations])}
        if feedback_type == "action_advising":
            self.feedback_type_to_translation_dict = self.action_to_number_dict

        self.base_prompt = "You are playing MineCraft and you want to craft diamond."

        if "known_dynamics" in condition_list:
            self.base_prompt += """
Below are the rules for the minecraft.
You need a crafting table to craft something.
You need a furnace to smelt something.
You can pick up a crafting table or a furnace and take them around. You need to place one in your current area if you want to use them.
You can get 3 iron ingot after smelting with 3 iron ore, 2 wood plank.
You can get 3 gold ingot after smelting with 3 gold ore, 2 wood plank.
You can get 8 iron ingot after smelting with 8 iron ore, 1 coal.
You can get 8 gold ingot after smelting with 8 gold ore, 1 coal.
You can craft 4 wood plank with 1 wood.
You can craft 4 stick with 2 wood plank.
You can craft 1 furnace with 8 cobblestone.
You can craft 3 paper with 3 reeds.
You can craft 1 book with 3 paper, 1 leather.
You can craft 1 enchanting table with 1 book, 4 obsidian, 2 diamond.
You can craft 1 clock with 4 gold ingot, 1 redstone.
You can craft 1 flint with 10 gravel.
You can craft 4 flint and steel with 1 iron ingot, 1 flint.
You can craft 2 blaze powder with 1 blaze rod.
You can craft 1 ender eye with 1 blaze powder, 1 ender pearl.
You can craft 10 wood pickaxe with 3 wood plank, 2 stick.
You can craft 10 wood axe with 3 wood plank, 2 stick.
You can craft 10 wood shovel with 1 wood plank, 2 stick.
You can craft 10 wood sword with 2 wood plank, 1 stick.
You can craft 20 stone pickaxe with 3 cobblestone, 2 stick.
You can craft 20 stone axe with 3 cobblestone, 2 stick.
You can craft 20 stone shovel with 1 cobblestone, 2 stick.
You can craft 20 stone sword with 2 cobblestone, 1 stick.
You can craft 40 iron pickaxe with 3 iron ingot, 2 stick.
You can craft 40 iron axe with 3 iron ingot, 2 stick.
You can craft 40 iron shovel with 1 iron ingot, 2 stick.
You can craft 40 iron sword with 2 iron ingot, 1 stick.
You can craft 10 gold pickaxe with 3 gold ingot, 2 stick.
You can craft 10 gold axe with 3 gold ingot, 2 stick.
You can craft 10 gold shovel with 1 gold ingot, 2 stick.
You can craft 10 gold sword with 2 gold ingot, 1 stick.
You can craft 100 diamond pickaxe with 3 diamond, 2 stick.
You can craft 100 diamond axe with 3 diamond, 2 stick.
You can craft 100 diamond shovel with 1 diamond, 2 stick.
You can craft 100 diamond sword with 2 diamond, 1 stick.
You can collect 2 dirt at forest.
You can collect 2 dirt at swamp.
You can collect 2 dirt at meadow.
You need to have at least 1 diamond shovel to collect 16 dirt at forest. 1 diamond shovel will be consumed.
You need to have at least 1 diamond shovel to collect 16 dirt at swamp. 1 diamond shovel will be consumed.
You need to have at least 1 diamond shovel to collect 16 dirt at meadow. 1 diamond shovel will be consumed.
You need to have at least 1 gold shovel to collect 24 dirt at forest. 1 gold shovel will be consumed.
You need to have at least 1 gold shovel to collect 24 dirt at swamp. 1 gold shovel will be consumed.
You need to have at least 1 gold shovel to collect 24 dirt at meadow. 1 gold shovel will be consumed.
You need to have at least 1 iron shovel to collect 12 dirt at forest. 1 iron shovel will be consumed.
You need to have at least 1 iron shovel to collect 12 dirt at swamp. 1 iron shovel will be consumed.
You need to have at least 1 iron shovel to collect 12 dirt at meadow. 1 iron shovel will be consumed.
You need to have at least 1 stone shovel to collect 8 dirt at forest. 1 stone shovel will be consumed.
You need to have at least 1 stone shovel to collect 8 dirt at swamp. 1 stone shovel will be consumed.
You need to have at least 1 stone shovel to collect 8 dirt at meadow. 1 stone shovel will be consumed.
You need to have at least 1 wood shovel to collect 4 dirt at forest. 1 wood shovel will be consumed.
You need to have at least 1 wood shovel to collect 4 dirt at swamp. 1 wood shovel will be consumed.
You need to have at least 1 wood shovel to collect 4 dirt at meadow. 1 wood shovel will be consumed.
You can collect 1 wood at forest.
You can collect 1 wood at swamp.
You need to have at least 1 diamond axe to collect 4 wood at forest. 1 diamond axe will be consumed.
You need to have at least 1 diamond axe to collect 4 wood at swamp. 1 diamond axe will be consumed.
You need to have at least 1 gold axe to collect 6 wood at forest. 1 gold axe will be consumed.
You need to have at least 1 gold axe to collect 6 wood at swamp. 1 gold axe will be consumed.
You need to have at least 1 iron axe to collect 3 wood at forest. 1 iron axe will be consumed.
You need to have at least 1 iron axe to collect 3 wood at swamp. 1 iron axe will be consumed.
You need to have at least 1 stone axe to collect 2 wood at forest. 1 stone axe will be consumed.
You need to have at least 1 stone axe to collect 2 wood at swamp. 1 stone axe will be consumed.
You need to have at least 1 wood axe to collect 1 wood at forest. 1 wood axe will be consumed.
You need to have at least 1 wood axe to collect 1 wood at swamp. 1 wood axe will be consumed.
You need to have at least 1 diamond shovel to collect 13 gravel at swamp. 1 diamond shovel will be consumed.
You need to have at least 1 gold shovel to collect 20 gravel at swamp. 1 gold shovel will be consumed.
You need to have at least 1 iron shovel to collect 10 gravel at swamp. 1 iron shovel will be consumed.
You need to have at least 1 stone shovel to collect 7 gravel at swamp. 1 stone shovel will be consumed.
You need to have at least 1 wood shovel to collect 3 gravel at swamp. 1 wood shovel will be consumed.
You need to have at least 1 diamond pickaxe to collect 4 cobblestone at forest. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 4 cobblestone at swamp. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 4 cobblestone at meadow. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 4 cobblestone at underground. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 4 cobblestone at bedrock. 1 diamond pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 6 cobblestone at forest. 1 gold pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 6 cobblestone at swamp. 1 gold pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 6 cobblestone at meadow. 1 gold pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 6 cobblestone at underground. 1 gold pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 6 cobblestone at bedrock. 1 gold pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 3 cobblestone at forest. 1 iron pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 3 cobblestone at swamp. 1 iron pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 3 cobblestone at meadow. 1 iron pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 3 cobblestone at underground. 1 iron pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 3 cobblestone at bedrock. 1 iron pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 2 cobblestone at forest. 1 stone pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 2 cobblestone at swamp. 1 stone pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 2 cobblestone at meadow. 1 stone pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 2 cobblestone at underground. 1 stone pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 2 cobblestone at bedrock. 1 stone pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 1 cobblestone at forest. 1 wood pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 1 cobblestone at swamp. 1 wood pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 1 cobblestone at meadow. 1 wood pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 1 cobblestone at underground. 1 wood pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 1 cobblestone at bedrock. 1 wood pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 coal at underground. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 coal at bedrock. 1 diamond pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 4 coal at underground. 1 gold pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 4 coal at bedrock. 1 gold pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 coal at underground. 1 iron pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 coal at bedrock. 1 iron pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 1 coal at underground. 1 stone pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 1 coal at bedrock. 1 stone pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 1 coal at underground. 1 wood pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 1 coal at bedrock. 1 wood pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 iron ore at underground. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 iron ore at bedrock. 1 diamond pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 iron ore at underground. 1 iron pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 iron ore at bedrock. 1 iron pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 1 iron ore at underground. 1 stone pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 1 iron ore at bedrock. 1 stone pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 gold ore at bedrock. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 gold ore at nether. 1 diamond pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 gold ore at bedrock. 1 iron pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 gold ore at nether. 1 iron pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 diamond at bedrock. 1 diamond pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 diamond at bedrock. 1 iron pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 1 obsidian at bedrock. 1 diamond pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 3 redstone at bedrock. 1 diamond pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 2 redstone at bedrock. 1 iron pickaxe will be consumed.
You need to have at least 1 diamond pickaxe to collect 20 netherrack at nether. 1 diamond pickaxe will be consumed.
You need to have at least 1 gold pickaxe to collect 30 netherrack at nether. 1 gold pickaxe will be consumed.
You need to have at least 1 iron pickaxe to collect 15 netherrack at nether. 1 iron pickaxe will be consumed.
You need to have at least 1 stone pickaxe to collect 10 netherrack at nether. 1 stone pickaxe will be consumed.
You need to have at least 1 wood pickaxe to collect 5 netherrack at nether. 1 wood pickaxe will be consumed.
You can collect 3 reeds at swamp.
You can collect 1 egg at meadow.
You need to have at least 1 diamond sword to collect 4 leather at meadow. 1 diamond sword will be consumed.
You need to have at least 1 gold sword to collect 6 leather at meadow. 1 gold sword will be consumed.
You need to have at least 1 iron sword to collect 3 leather at meadow. 1 iron sword will be consumed.
You need to have at least 1 stone sword to collect 2 leather at meadow. 1 stone sword will be consumed.
You need to have at least 1 wood sword to collect 1 leather at meadow. 1 wood sword will be consumed.
You need to have at least 1 gold sword to collect 3 blaze rod at nether. 1 gold sword will be consumed.
You need to have at least 1 diamond sword to collect 2 ender pearl at underground. 1 diamond sword will be consumed.
You need to have at least 1 diamond sword to collect 2 ender pearl at end. 1 diamond sword will be consumed.
You need to have at least 1 iron sword to collect 2 ender pearl at underground. 1 iron sword will be consumed.
You need to have at least 1 iron sword to collect 2 ender pearl at end. 1 iron sword will be consumed.
You need to have at least 1 diamond sword to collect 1 ender dragon head at end. 1 diamond sword will be consumed.
You can move to forest from swamp.
You can move to forest from meadow.
You can move to forest from underground.
You can move to forest from bedrock.
You can move to swamp from forest.
You can move to swamp from meadow.
You can move to swamp from underground.
You can move to swamp from bedrock.
You can move to meadow from forest.
You can move to meadow from swamp.
You can move to meadow from underground.
You can move to meadow from bedrock.
"""

            if "only_expert_path_dynamics" in condition_list:
                self.base_prompt += """
Below are some rules for the game.
You can collect 1 wood at forest.
You can craft 4 wood plank with 1 wood.
You can craft 4 stick with 2 wood plank.
You can craft 4 stick with 2 wood plank.
You can craft 4 stick with 2 wood plank.
You can craft 10 wood pickaxe with 3 wood plank, 2 stick.
You need to have at least 1 wood pickaxe to collect 1 cobblestone at forest. 1 wood pickaxe will be consumed.
You can craft 20 stone pickaxe with 3 cobblestone, 2 stick.
You can craft 20 stone pickaxe with 3 cobblestone, 2 stick.
You need to have at least 1 stone pickaxe to collect 1 iron ore at underground. 1 stone pickaxe will be consumed.
You can move to meadow from underground.
You can move to swamp from meadow.
You can move to forest from swamp.
You need to have at least 1 stone pickaxe to collect 2 cobblestone at forest. 1 stone pickaxe will be consumed.
You can craft 1 furnace with 8 cobblestone.
You can craft 1 furnace with 8 cobblestone.
You can get 3 iron ingot after smelting with 3 iron ore, 2 wood plank.
You can craft 40 iron pickaxe with 3 iron ingot, 2 stick.
You can craft 40 iron pickaxe with 3 iron ingot, 2 stick.
You need to have at least 1 iron pickaxe to collect 2 diamond at bedrock. 1 iron pickaxe will be consumed.
""".strip()

#             self.base_prompt += """
# Below are the recipes of the game.
# You can get 3 iron ingot after smelting with 3 iron ore, 2 wood plank.
# You can get 3 gold ingot after smelting with 3 gold ore, 2 wood plank.
# You can get 8 iron ingot after smelting with 8 iron ore, 1 coal.
# You can get 8 gold ingot after smelting with 8 gold ore, 1 coal.
# You can craft 4 wood plank with 1 wood.
# You can craft 4 stick with 2 wood plank.
# You can craft 1 furnace with 8 cobblestone.
# You can craft 3 paper with 3 reeds.
# You can craft 1 book with 3 paper, 1 leather.
# You can craft 1 enchanting table with 1 book, 4 obsidian, 2 diamond.
# You can craft 1 clock with 4 gold ingot, 1 redstone.
# You can craft 1 flint with 10 gravel.
# You can craft 4 flint and steel with 1 iron ingot, 1 flint.
# You can craft 2 blaze powder with 1 blaze rod.
# You can craft 1 ender eye with 1 blaze powder, 1 ender pearl.
# You can craft 10 wood pickaxe with 3 wood plank, 2 stick.
# You can craft 10 wood axe with 3 wood plank, 2 stick.
# You can craft 10 wood shovel with 1 wood plank, 2 stick.
# You can craft 10 wood sword with 2 wood plank, 1 stick.
# You can craft 20 stone pickaxe with 3 cobblestone, 2 stick.
# You can craft 20 stone axe with 3 cobblestone, 2 stick.
# You can craft 20 stone shovel with 1 cobblestone, 2 stick.
# You can craft 20 stone sword with 2 cobblestone, 1 stick.
# You can craft 40 iron pickaxe with 3 iron ingot, 2 stick.
# You can craft 40 iron axe with 3 iron ingot, 2 stick.
# You can craft 40 iron shovel with 1 iron ingot, 2 stick.
# You can craft 40 iron sword with 2 iron ingot, 1 stick.
# You can craft 10 gold pickaxe with 3 gold ingot, 2 stick.
# You can craft 10 gold axe with 3 gold ingot, 2 stick.
# You can craft 10 gold shovel with 1 gold ingot, 2 stick.
# You can craft 10 gold sword with 2 gold ingot, 1 stick.
# You can craft 100 diamond pickaxe with 3 diamond, 2 stick.
# You can craft 100 diamond axe with 3 diamond, 2 stick.
# You can craft 100 diamond shovel with 1 diamond, 2 stick.
# You can craft 100 diamond sword with 2 diamond, 1 stick.
# """.strip()

        # self.explicit_thinking_guides = """
        # You should think about these questions.
        # 1. Based on the rules you know, what do you need to do to get a diamond?
        # 2. Based on the current inventory, do you have all of them?
        # 3. If you do not have all of the items you need, based on the rules and doable actions, can you get them now?
        # 4. If no, what do you need or where should you go to get them?
        # """.strip()

        self.explicit_thinking_guides = """
You should think about these questions.
You need to get a diamond.
Based on the rules you know, what subgoals do you need to achieve?
Based on what you see and what you have, what subgoals have you achieved?
If you have not achieved all of the subgoals, based on the rules and doable actions, can you achieve any subgoals now?
If yes, which subgoal do you want to achieve next?
If no, what do you need or where should you go next?
""".strip()


        self.delta_action_prompt_cot = ""
        self.if_optimal_prompt_cot = """
OBSREPRESENTATION    
Is action ACTION the best action you can take? Please think step by step.  
Only give the answer in a new line in JSON format:
{"reasoning": <REASONING>, "feedback": <FEEDBACK>}
Where <FEEDBACK> is one of "YES" or "NO", <REASONING> is a string of your thinking steps.
                    """

        self.action_advising_base_prompt_cot = """
OBSREPRESENTATION
Which action do you choose? Please think step by step.
Only give the answer in a new line in JSON format:
{"reasoning": <REASONING>, "action": <ACTION>}
Where <ACTION> is one of possible actions, <REASONING> is a string of your thinking steps.
                    """

        self.preference_base_prompt_cot = """
OBSREPRESENTATION
Given ACTION1 or ACTION2, which action is better? Please think step by step.
Only give the answer in a new line in JSON format:
{"reasoning": <REASONING>, "preference": <PREFERENCE>}
Where <PREFERENCE> is one of "FIRST" or "SECOND", <REASONING> is a string of your thinking steps.
            """

    def domain_specific_prompt_process(self, data, prompt):
        """
        Remove _ -
        :param data:
        :param prompt:
        :return:
        """

        def history_context_prompt_process(data):
            history = data["history"]
            if len(history) == 0:
                return ""
            history_str = "\nHere is the history of your actions:\n"

            for i in range(0, len(history)):
                templet = "At Step {step}, you observation is: \n {observation}. \n You took action {action}. Then your observation became: \n {next_state}\n".format(step=i, action=self.number_to_action_dict[history[i]["action"]], observation=history[i]["state"], next_state=history[i]["next_state"])
                history_str += templet
            return history_str

        if "explain_legal_action_dynamics" in self.condition_list:
            explain_str = """
            Below are some explanations of the actions you can take.
            """.strip()
            legal_actions = data["possible_actions_index"]
            prompt = prompt.strip() + explain_str + construct_legal_action_rules(self.env_instance, legal_actions, exlucded_actions=[]).strip()

        if "history_context" in self.condition_list:
            prompt += history_context_prompt_process(data)

        # if "explicit_thinking_guides" in self.condition_list:
        #     return replace_symbols_from_str_to_space(prompt, ["_", "-"]).strip() + self.explicit_thinking_guides
        # else:
        #     # Normal case
        #     return replace_symbols_from_str_to_space(prompt, ["_", "-"]).strip()

        return replace_symbols_from_str_to_space(prompt, ["_", "-"]).strip()


