import requests
import json
import numpy as np
import re
import numpy as np



def object_ext_llm_prompt(text: str):
    prompt = (
        "Your task is to strictly extract structured information from the given text.\n\n"
        "Format rules (follow exactly):\n"
        "1) Line 1 — MAIN OBJECT: write ONLY ONE object — the single target object of the command — optionally followed by comma-separated "
        "visual attributes (e.g., color, shape, size, texture, material, distinctive markings). Use this format: object_name[, attribute1, attribute2...]. "
        "Include only visual attributes. Do NOT include non-visual info (function, state, quantity, actions, context). "
        "NEVER list more than one object here. Do NOT include spatial attributes (front, back, left, right, above, below, between, closest, farthest, supported-by, supporting).\n"
        "2) Line 2 — RELATED OBJECTS: list ALL related objects and their visual attributes using this exact pattern for each item and "
        "separate items with a semicolon and a space:\n"
        "   object_name[, attribute1, attribute2...]; object_name2[, attribute1...]\n"
        "   Do NOT repeat the main object here. Do NOT include spatial attributes (front, back, left, right, above, below, between, closest, farthest, supported-by, supporting). "
        "If there are no related objects, leave this line completely blank (an empty line). Do NOT write 'None', 'N/A', 'no visual image', "
        "'unknown', or any other placeholder.\n"
        "3) Line 3 — RELATION KEYWORD: write EXACTLY ONE of these words (lowercase) that best describes the spatial relation between the "
        "main object and the related objects:\n"
        "   closest, farthest, left, right, front, back, below, supported-by, above, supporting, between\n"
        "   Nothing else on this line.\n"
        "4) Line 4 — ORIENTATION IMPORTANCE: list which objects have an orientation/viewpoint that matters for the command. Use the exact "
        "format for each item: object_name: orientation. Allowed orientation keywords (lowercase) are: front, back, left, right. "
        "Separate multiple items with a comma and a space.\n"
        "   If orientation/viewpoint does NOT matter for any object, leave this line completely blank. Do NOT write 'None', 'N/A', or any placeholder.\n"
        "5) If an attribute cannot be determined, simply omit it (do not invent or insert placeholders).\n"
        "6) Do not enclose output in quotes or code blocks, do not add labels like 'Line 1', and do not add punctuation or extra characters "
        "beyond the specified formats.\n\n"
        f"Text: {text}\n\n"
        "Return the output in exactly four lines as instructed above."
    )
    return prompt


def parse_llm_object_ext_output(raw_output: str) -> dict:
    """
    Parse the 4-line structured output from the LLM into a dictionary.

    Expected format of raw_output:
        line 1 -> main object (with optional visual attributes)
        line 2 -> related objects (semicolon-separated, may be empty)
        line 3 -> relation keyword
        line 4 -> orientation importance (comma-separated key:value, may be empty)
    """
    lines = raw_output.strip().split("\n")

    # Ensure at least 4 lines (fill missing with empty strings)
    while len(lines) < 4:
        lines.append("")

    # Lowercase everything
    main_object = lines[0].strip().lower()
    related_objects_line = lines[1].strip().lower()
    relation = lines[2].strip().lower()
    orientation_line = lines[3].strip().lower()

    # Remove extra commas or spaces in main object
    main_object = " ".join(main_object.split())

    # Parse related objects into list, remove extra commas/spaces inside each object
    related_objects = []
    if related_objects_line:
        for obj in related_objects_line.split(";"):
            obj_clean = " ".join(obj.strip().split())
            if obj_clean:
                related_objects.append(obj_clean)

    # Parse orientation importance into dict, remove extra spaces
    orientation_importance = {}
    if orientation_line:
        parts = [p.strip() for p in orientation_line.split(",") if p.strip()]
        for part in parts:
            if ":" in part:
                obj, orient = part.split(":", 1)
                orientation_importance[" ".join(obj.strip().split())] = orient.strip()

    return {
        "raw_output": raw_output,
        "main_object": main_object if main_object else None,
        "related_objects": related_objects,
        "relation": relation if relation else None,
        "orientation_importance": orientation_importance,
    }



def send_to_llm(prompt,model, api):
    response = requests.post(
    url="https://openrouter.ai/api/v1/chat/completions",
    headers={
        "Authorization": "Bearer " + api,
        "Content-Type": "application/json"
    },
    data=json.dumps({
        "model": model,
        "messages": [
        {
            "role": "user",
            "content": prompt
        }
        ],
        
    })
    )

    if response.status_code == 200:
        response_json = response.json()
        message = response_json.get("choices", [{}])[0].get("message", {}).get("content", "No content found.")
        return message
    else:
        return ("Request failed with status code:", response.status_code), ("Response content:", response.text)




def llm_object_extractor(text, model , api_key ):
    prompt = object_ext_llm_prompt(text)
    llm_o = send_to_llm(prompt,model, api_key)
    print(llm_o)
    return parse_llm_object_ext_output(llm_o)
    



def build_llm_prompt(main_object, main_candidates, other_objects, prompt_text):

    prompt = []
    
    # description
    prompt.append(f'Text: "{prompt_text}"\n')
    
    # main object candidates
    prompt.append(f'The main object is "{main_object}".')
    prompt.append("It has the following candidate positions with indices:")
    for i, pos in enumerate(main_candidates):
        pos_str = ", ".join([f"{coord:.2f}" for coord in np.array(pos).flatten()])
        prompt.append(f"Index {i}: ({pos_str})")
    
    # print(other_objects)
    # other objects
    if other_objects:
        prompt.append("\nOther objects and their positions are:")
        for obj_name, centers in other_objects.items():
            # print('***************', obj_name, centers)
            for j, pos in enumerate(centers):
                pos_str = ", ".join([f"{float(p):.2f}" for p in pos])
                prompt.append(f"{obj_name} [{j}]: ({pos_str})")
    
    # instruction
    prompt.append(
        "\nInstruction:\n"
        f'Based on the text above, decide which candidate index of "{main_object}" is the correct target.\n'
        "Return only the numeric index (e.g., 0, 1, 2, ...). Do not return anything else."
    )
    
    return "\n".join(prompt)




def parse_final_llm(output_str):
    """
    Extracts all integers from the LLM output string
    and returns the last one as an int.
    
    output_str: str, raw output from LLM
    
    Returns: int or None if no number found
    """
    numbers = re.findall(r"\d+", output_str)
    if not numbers:
        return None
    return int(numbers[-1])



def build_llm_prompt_view(main_object, main_candidates, other_objects, prompt_text, orientation):
    prompt = []
    
    # description
    prompt.append(f'Text: "{prompt_text}"\n')
    
    # main object candidates
    prompt.append(f'The main object is "{main_object}".')
    prompt.append("It has the following candidate positions with indices (x, y, z where z is height):")
    for i, pos in enumerate(main_candidates):
        coords = np.array(pos).flatten()
        if len(coords) >= 3:
            pos_str = f"x={coords[0]:.2f}, y={coords[1]:.2f}, z={coords[2]:.2f}"
        else:
            pos_str = ", ".join([f"{coord:.2f}" for coord in coords])
        prompt.append(f"Index {i}: ({pos_str})")
    
    # other objects
    if other_objects:
        prompt.append("\nOther objects and their positions are:")
        for obj_name, centers in other_objects.items():
            for j, pos in enumerate(centers):
                coords = np.array(pos).flatten()
                if len(coords) >= 3:
                    pos_str = f"x={coords[0]:.2f}, y={coords[1]:.2f}, z={coords[2]:.2f}"
                else:
                    pos_str = ", ".join([f"{coord:.2f}" for coord in coords])
                prompt.append(f"{obj_name} [{j}]: ({pos_str})")
    
    # helper for axis explanation
    def axis_text(a):
        a = a % 360
        if a == 0: return "positive x direction"
        if a == 90: return "positive y direction"
        if a == 180: return "negative x direction"
        if a == 270: return "negative y direction"
        if 0 < a < 90: return "between positive x and positive y"
        if 90 < a < 180: return "between positive y and negative x"
        if 180 < a < 270: return "between negative x and negative y"
        if 270 < a < 360: return "between negative y and positive x"
        return ""
    
    # orientation (with x,y explanation)
    if orientation:
        prompt.append("\nOrientation information (object, orientation_label) and angles in degrees:")
        for key, angles in orientation.items():
            if isinstance(key, tuple) and len(key) >= 2:
                obj_name = str(key[0])
                ori_label = str(key[1])
            else:
                obj_name = str(key)
                ori_label = None
            
            angles_arr = np.array(angles).flatten()
            if angles_arr.size == 0:
                continue
            
            angle = float(angles_arr[0])  # assume one main angle
            if ori_label:
                prompt.append(f"{obj_name} ({ori_label}): [{angle:.2f}]")
                
                # compute directions
                left = (angle + 90) % 360
                right = (angle - 90) % 360
                back = (angle + 180) % 360
                
                prompt.append(
                    f"When facing {ori_label} ({angle:.0f}°): "
                    f"Forward = {angle:.0f}° ({axis_text(angle)}), "
                    f"Left = {left:.0f}° ({axis_text(left)}), "
                    f"Right = {right:.0f}° ({axis_text(right)}), "
                    f"Back = {back:.0f}° ({axis_text(back)})."
                )
            else:
                angles_str = ", ".join([f"{a:.2f}" for a in angles_arr])
                prompt.append(f"{obj_name}: [{angles_str}]")
    
    # instruction
    prompt.append(
        "\nInstruction:\n"
        f'Based on the text above, decide which candidate index of "{main_object}" is the correct target.\n'
        "Return only the numeric index (e.g., 0, 1, 2, ...). Do not return anything else."
    )
    
    return "\n".join(prompt)


    
    
def final_llm(main_object, main_candidates, other_objects, prompt_text, model , api_key, orientation ={}):
    if len(orientation)>0:
        prompt = build_llm_prompt_view(main_object, main_candidates, other_objects, prompt_text, orientation)
    else:
        prompt = build_llm_prompt(main_object, main_candidates, other_objects, prompt_text)
    llm_o = send_to_llm(prompt,model, api_key)
    return parse_final_llm(llm_o)
