"""
Batch task proposal script.

Accepts either a list of local file paths or a local directory and runs the Claude
task proposer agent on each file. For the evaluation environment, the file path is
constructed as: <onedrive_prefix>/<basename(local_file)>, so the file must already
exist in OneDrive under that prefix. Writes proposed tasks per file into a JSON
file, using the `Task` structure from `officearena.environments.task` and extracting
any leading tags (e.g., "[EASY]", "[MEDIUM]", "[HARD]") into `misc['tags']`.
"""

import argparse
import json
import os
import re
from dataclasses import asdict
from pathlib import Path
from typing import List, Tuple

from officearena.agents import ClaudeTaskProposer
from officearena.environments import OfficeArena
from officearena.environments.task import Task
from officearena.utils.task_proposal import proposed_tasks


def parse_task_string(task_str: str) -> Tuple[str, List[str]]:
    tags: List[str] = []
    remaining = task_str

    while True:
        match = re.match(r"^\s*\[(?P<tag>[^\]]+)\]\s*", remaining)
        if not match:
            break
        tags.append(match.group("tag").strip())
        remaining = remaining[match.end() :]

    goal = remaining.strip(" \t\r\n:;-—")
    return goal, tags


def discover_files(files: List[str], directory: str | None) -> List[str]:
    """Resolve input files.

    - If `directory` is a local directory, scan for supported Office file types.
    - Only include explicitly provided `files` and locally discovered files.
    """

    discovered: List[str] = []
    if files:
        discovered.extend(files)

    if directory:
        dir_path = Path(directory)
        if dir_path.exists() and dir_path.is_dir():
            for ext in ("*.pptx", "*.ppt", "*.docx", "*.doc", "*.xlsx", "*.xls"):
                for p in sorted(dir_path.glob(ext)):
                    discovered.append(str(p))
        else:
            print(f"Warning: --dir '{directory}' is not a local directory. Skipping directory discovery.")

    seen = set()
    unique: List[str] = []
    for fp in discovered:
        if fp not in seen:
            unique.append(fp)
            seen.add(fp)
    return unique


def tasks_to_serializable(file_path: str, task_strings: List[str]) -> dict:
    serializable_tasks: List[dict] = []
    base_stem = Path(file_path).stem

    for idx, raw in enumerate(task_strings, start=1):
        goal, tags = parse_task_string(raw)
        task = Task(
            task_id=f"{base_stem}-{idx:03d}",
            goal=goal,
            grader=None,
            tags=tags,
            file_path=file_path,
        )
        serializable_tasks.append(asdict(task))

    return {
        "file": file_path,
        "num_tasks": len(serializable_tasks),
        "tasks": serializable_tasks,
    }


def run_for_file(
    env: OfficeArena,
    agent: ClaudeTaskProposer,
    file_path: str,
    task_instruction: str,
    screenshot_dir_base: str | Path,
) -> List[str]:
    proposed_tasks.set([])
    try:
        env.evaluate_agent(
            agent=agent,
            file_path=file_path,
            task_instruction=task_instruction,
            save_screenshots=True,
            screenshot_dir=str(Path(screenshot_dir_base) / f"claude_task_proposer_{Path(file_path).stem}_screenshots"),
        )
    except Exception as e:
        print(f"Warning: evaluation error for '{file_path}': {e}")

    return proposed_tasks.get()


def main():
    parser = argparse.ArgumentParser(description="Batch propose tasks for Office files")
    parser.add_argument("--files", nargs="*", default=[], help="Specific local file paths to evaluate")
    parser.add_argument(
        "--dir",
        default=None,
        help="Local directory of files to evaluate (scans for .pptx, .ppt, .docx, .doc, .xlsx, .xls).",
    )
    parser.add_argument(
        "--onedrive-prefix",
        required=True,
        help="OneDrive directory prefix (relative to your OneDrive root configured in OfficeArena), e.g. 'PowerPoint' or 'Excel'. The evaluated file path becomes '<prefix>/<basename>'.",
    )
    parser.add_argument("--output-dir", default="proposed_tasks", help="Directory to write per-file JSON outputs")
    parser.add_argument(
        "--overwrite",
        action="store_true",
        help="Recompute outputs even if a JSON for a file already exists (default: False)",
    )
    parser.add_argument("--headless", action="store_true", help="Run browser headless (default: False)")
    parser.add_argument("--max-steps", type=int, default=35, help="Max steps per evaluation")
    parser.add_argument("--step-delay", type=float, default=2.0, help="Delay between steps in seconds")
    parser.add_argument("--display-width", type=int, default=1024)
    parser.add_argument("--display-height", type=int, default=768)
    args = parser.parse_args()

    try:
        from dotenv import load_dotenv

        load_dotenv()
        print("Loaded environment variables from .env file.")
    except ImportError:
        print("dotenv not installed. Relying on shell environment variables.")

    client_id = os.getenv("CLIENT_ID")
    claude_model_name = os.getenv("CLAUDE_MODEL_NAME")
    claude_base_url = os.getenv("CLAUDE_BASE_URL")
    claude_api_key = os.getenv("CLAUDE_API_KEY", {})

    if not client_id or not claude_model_name:
        print("---" * 10)
        print("ERROR: Missing required environment variables.")
        print("Please ensure CLIENT_ID, CLAUDE_MODEL_NAME, and CLAUDE_API_KEY are set.")
        print("---" * 10)
        return

    files_to_run = discover_files(args.files, args.dir)
    if not files_to_run:
        print("No input files provided. Use --files or --dir.")
        return

    output_dir = Path(args.output_dir)
    output_dir.mkdir(parents=True, exist_ok=True)

    task_instruction = (
        "Explore the current file and propose tasks to add to the dataset. "
        "When adding tasks to the dataset tag each task as easy, medium or hard. "
        "Also add a slide number for each task. "
        "You can do this by using the function 'add_tasks_to_dataset' with a list of tasks "
        "and using the '[DIFFICULTY][SLIDE:N] task' format for each task you add to the dataset. "
        "Make sure to include a variety of tasks that real users would want to do. "
        "Though, the benchmark will evaluate computer use agents instead of actual people, so do not propose tasks that require personal information. "
        "In our benchmark, we will be creating reward functions for each task using a mix of programmatic validation in python "
        "using python-pptx and LLMs/VLMs with slide screensot access (only slides, not the GUI, notes, comments, etc.) and some animation/transition validation. "
        "Please make sure to limit proposed tasks to ones that can be evaluated automatically in such a manner. "
        "E.g., do not propose tasks related video, audio, etc. that cannot be evaluated with just the above context. "
        "Note that there may be more slides than what you can see in the current view, so you may need to scroll to see all slides. "
        "You can add tasks as you are exploring the file, instead of waiting until the very end. "
        "When you are done, call the function 'finish' with a message to the user with a reason for finishing."
    )

    display_size = {"width": args.display_width, "height": args.display_height}

    env = OfficeArena(
        client_id=client_id,
        headless=args.headless,
        max_steps=args.max_steps,
        step_delay=args.step_delay,
        resolution=(display_size["width"], display_size["height"]),
    )

    agent_config = {
        "model_name": claude_model_name,
        "api_key": claude_api_key,
        "base_url": claude_base_url,
        "display_size": display_size,
    }
    agent = ClaudeTaskProposer(config=agent_config)

    for file_path in files_to_run:
        print("-" * 60)
        print(f"Evaluating: {file_path}")
        # Construct the OneDrive path used by the environment
        remote_path = f"{args.onedrive_prefix.rstrip('/')}/{Path(file_path).name}"
        task_strings: List[str] = []
        out_path = output_dir / f"{Path(file_path).stem}.proposed_tasks.json"

        if out_path.exists() and not args.overwrite:
            print(f"Skipping {file_path} (output already exists at {out_path}). Use --overwrite to recompute.")
            continue
        try:
            task_strings = run_for_file(
                env,
                agent,
                remote_path,
                task_instruction,
                screenshot_dir_base=output_dir,
            )
        except Exception as e:
            print(f"Failed to evaluate {remote_path}: {e}")
            try:
                task_strings = proposed_tasks.get() or []
            except Exception:
                task_strings = []

        payload = tasks_to_serializable(remote_path, task_strings)
        try:
            with out_path.open("w", encoding="utf-8") as f:
                json.dump(payload, f, ensure_ascii=False, indent=2)
            print(f"Wrote {payload['num_tasks']} tasks → {out_path}")
        except Exception as e:
            print(f"Error writing tasks for {file_path} to {out_path}: {e}")


if __name__ == "__main__":
    main()
