import json


def split_single_message_list(messages, trajectory):
    """
    Split a single message list into multiple rounds.

    Args:
        messages (list): List of message dictionaries with 'role' and 'content' keys

    Returns:
        list: List of rounds, where each round contains messages and remaining chat
    """
    message_list = [[messages[0]]]
    for i in range(1, len(messages), 2):
        if i == len(messages)-1:
            message_list.append([messages[i]])
        else:
            message_list.append([messages[i], messages[i+1]])
    question_name_map = {}
    for i, q_name in enumerate(trajectory[-1][0]):
        question_name_map.update({q_name: message_list[i+1]})
    
    rounds = []
    history_messages = []
    for i in range(len(trajectory)):
        history_messages.extend(message_list[i])
        round_entry = {"round_number": i+1, "messages": history_messages.copy()}
        if trajectory[i][-1] == []:
            remaining_messages = [message_list[-1][0]]
        else:
            remaining_messages = []
        for q_name in trajectory[i][-1]:
            remaining_messages.extend(question_name_map[q_name])
        if remaining_messages:
            remaining_chat_parts = []
            info_set = []
            for msg in remaining_messages:
                role = msg.get("role", "")
                content = msg.get("content", "")
                remaining_chat_parts.append(f"{role}: {content}")
                if role == "assistant":
                    info_set.append(content)
            round_entry["remaining_chat"] = "\n".join(remaining_chat_parts)
            round_entry["info_set"] = info_set
        else:
            round_entry["remaining_chat"] = ""
        rounds.append(round_entry)

    return rounds


def split_session_to_json_lines(session):
    """
    Split a session dictionary into multiple rounds and convert to JSON lines.

    Args:
        session (dict): Session dictionary containing 'session_id', 'topic', and 'messages' keys
            - session_id (str): Session identifier
            - topic (str): Topic information
            - messages (list): List of message dictionaries with 'role' and 'content' keys

    Returns:
        list: List of JSON strings, each representing a round with cid, session_id, topic, messages, and remaining_chat
    """
    rounds = split_single_message_list(session["messages"], session["trajectory"])

    json_lines = []
    for round_data in rounds:
        round_entry = {
            "cid": f"{session['session_id']}_{round_data['round_number']}",
            "session_id": session["session_id"],
            "topic": session.get("topic", ""),  # Use topic instead of diagn
            "messages": round_data["messages"],
            "remaining_chat": round_data["remaining_chat"],
            "info_set": round_data.get("info_set", [])
        }

        json_lines.append(json.dumps(round_entry, ensure_ascii=False))

    return json_lines

def filter_redundant_chats(chat_list):
    filtered_list = []
    for item in chat_list:
        if "messages" not in item or "remaining_chat" not in item:
            filtered_list.append(item)
            continue

        messages = item["messages"]
        remaining_chat_str = item["remaining_chat"]

        formatted_messages_parts = [f"{msg['role']}: {msg['content']}" for msg in messages]
        messages_as_string = "\n\n".join(formatted_messages_parts)

        if messages_as_string != remaining_chat_str:
            filtered_list.append(item)

    return filtered_list

