
import pandas as pd
import random
random.seed(42)

import json
SYSTEM_PROMPT_FOR_ACTION = """You are an Action Agent responsible for achieving a text-based task. 
"""

NEW_FORMAT = """
Attention:
1. You MUST provide your thought (one or two lines) before taking action, put the thought in the <think>...</think>.
2. You MUST issue only ONE action in each interaction stage, and put the action in the <answer>...</answer>.

Use the following format:
<think> put your thought here </think>
<answer> put your action here </answer>

Please provide your response on the task following the format strictly.
"""

def read_json(path):
    with open(path, 'r', encoding='utf8') as f:
        return json.loads(f.read())

def write_to_json(data, path):
    with open(path, 'w', encoding='utf8') as f:
        f.write(json.dumps(data, ensure_ascii=False, indent=4))


Format_String = [
    "\"Thought: your thoughts.\nAction: your next action\n\"",
    "Thought:\n<Your Thought>\n\nAction:\n<Your Action>",
    "Thought:\n<Your Thought>\n\nAction:\n<The Word You Guess>",
    "Thought:\nyour thoughts.\n\nAction:\nyour next action",
    "Thought: Your thought here.\n\nAction: ```sql\nSELECT * FROM table WHERE condition;\n```",
    "Thought:\n ... \n\nAction:\n ...",
    "Thought: [your thought]\n\nAction: [your action] with Action Input: [your action input]",
    "Thought:\nI think ... \n\nAction: \nclick[something]"
]

def process(conversation):
    system_prompt = SYSTEM_PROMPT_FOR_ACTION
    user_prompt = conversation[0]["value"] + "\n\n" + conversation[2]["value"]

    user_prompt += "\n\n" + NEW_FORMAT

    messages = [
        {
            "role": "system",
            "content": system_prompt,
            "cal_loss": False
        },
        {
            "role": "user",
            "content": user_prompt,
            "cal_loss": False
        }
    ]
    for conv in conversation[3:]:
        if conv["from"] == "gpt":
            thought = conv["value"].split("Thought:")[-1].split("Action:")[0].strip()
            action = conv["value"].split("Action:")[-1].strip()
            content = f"<think> {thought} </think>\n<answer> {action} </answer>"

        elif conv["from"] == "human":
            obs = conv["value"].split("Observation:")[-1].split("Give me one action.")[0].strip()
            content = obs
        else:
            raise ValueError("unknown role")

        messages.append({
            "role": "user" if conv["from"] == "human" else "assistant",
            "content": content,
            "cal_loss": True if conv["loss"] else False
        })
    
    return messages


if __name__ == "__main__":
    # remove babyai
    paths = [
        "../data/AgentGym/alfworld_train.json",
        "../data/AgentGym/lmrlgym_maze_train.json",
        "../data/AgentGym/lmrlgym_wordle_train.json",
        "../data/AgentGym/sciworld_train.json",
        "../data/AgentGym/sqlgym_train.json",
        "../data/AgentGym/textcraft_train.json",
        "../data/AgentGym/tool_movie_train.json",
        "../data/AgentGym/tool_todo_train.json",
        "../data/AgentGym/tool_weather_train.json",
        "../data/AgentGym/webshop_train.json",
    ]
    total_new_data = []
    for path in paths:
        data = read_json(path)
        for item in data:
            total_new_data.append({
                "id": item["item_id"],
                "messages": process(item["conversations"])
            })
    
    random.shuffle(total_new_data)
    print(len(total_new_data))
    out_path = "train_data/agent-gym_v1.json"
    write_to_json(total_new_data, out_path)
