import json
import uuid
import os
from typing import Dict, List, Any
from core.environment import WorkEnvironment

class MessagesParser:

    def load_datasets_messages(self, dataset_item: Dict) -> Dict:
        """
        return: {"tools": [...], "initial_query": str, "full_messages": [...]}
        """
        tools = dataset_item.get("tools", [])
        messages = dataset_item.get("messages", [])
        
        initial_query = ""
        for msg in messages:
            if msg["role"] == "user":
                initial_query = msg["content"]
                break
        
        return {
            "tools": tools,
            "initial_query": initial_query,
            "full_messages": messages
        }


    def transform_ENV_to_messages(self, system_msg: str, history_records: List[Dict], dataset_id: str, tools: List[Dict], save_dir: str) -> List[Dict]:
        """
        Args:
            history_records: List[Dict], snapshot_record
            dataset_id
        """
        full_case_messages = []
        
        if system_msg:
            full_case_messages.append({
                "role": "system",
                "content": system_msg
            })

        def get_attr(obj, name, default=None):
            if isinstance(obj, dict):
                return obj.get(name, default)
            return getattr(obj, name, default)

        for record in history_records:
            env = record.get("WorkEnvironment", {})
            finish_msg = record.get("finish_msg", "")
            
            # --- 1. User Message ---
            objectives = get_attr(env, 'objective', [])
            if objectives:
                current_turn_objective = objectives[-1]
                full_case_messages.append({
                    "role": "user",
                    "content": current_turn_objective
                })

            # --- 2. Tool Execution Process (Thinking -> Tool Calls -> Outputs) ---
            thinking_history = get_attr(env, 'thinking_history', [])
            dispatch_list_history = get_attr(env, 'dispatch_list_history', [])
            task_history = get_attr(env, 'task_history', [])
            
            steps_count = len(thinking_history)
            available_tasks = list(task_history)

            last_turn_thinking = None

            for i in range(steps_count):
                thought = thinking_history[i]
                dispatch_batch = dispatch_list_history[i]

                if thought:
                    last_turn_thinking = thought

                if dispatch_batch:
                    assistant_msg = {
                        "role": "assistant",
                        "content": thought if thought else None,
                        "tool_calls": []
                    }
                    tool_calls_obj = []
                    tool_outputs_data = []

                    for dispatch_str in dispatch_batch:
                        matched_task = None
                        for task in available_tasks:
                            if get_attr(task, "context") == dispatch_str:
                                matched_task = task
                                break
                        
                        if matched_task:
                            available_tasks.remove(matched_task)
                            
                            fc_content = get_attr(matched_task, "fc_content", {})
                            if isinstance(fc_content, str):
                                try: fc_content = json.loads(fc_content)
                                except: fc_content = {}
                            

                            tool_name = fc_content.get("name", "unknown_tool")
                            tool_args = fc_content.get("arguments", {})
                            
                            call_id = f"call_{uuid.uuid4().hex[:8]}"
                            
                            tool_calls_obj.append({
                                "id": call_id,
                                "type": "function",
                                "function": {
                                    "name": tool_name,
                                    "arguments": json.dumps(tool_args, ensure_ascii=False)
                                }
                            })
                            
                            raw_result = get_attr(matched_task, "result", "")
                            result_content = raw_result

                            tool_outputs_data.append({
                                "tool_call_id": call_id,
                                "name": tool_name,
                                "content": result_content
                            })

                    if tool_calls_obj:
                        assistant_msg["tool_calls"] = tool_calls_obj
                        full_case_messages.append(assistant_msg)
                        
                        for output in tool_outputs_data:
                            full_case_messages.append({
                                "role": "tool",
                                "tool_call_id": output["tool_call_id"],
                                "name": output["name"],
                                "content": output["content"]
                            })

            full_case_messages.append({
                "role": "assistant",
                "reasoning_content": last_turn_thinking,
                "content": record.get("finish_msg") or get_attr(env, 'scratchpads', [])[-1]
            })

        final_result = {
            "tools": tools,
            "messages": full_case_messages
        }

        # --- Save to File ---
        results_dir = os.path.join(save_dir, 'messages')
        if not os.path.exists(results_dir):
            os.makedirs(results_dir)
        
        file_path = os.path.join(results_dir, f"{dataset_id}.json")
        with open(file_path, 'w', encoding='utf-8') as f:
            json.dump(final_result, f, indent=4, ensure_ascii=False)

        return final_result
