from __future__ import annotations

import argparse
import json
from pathlib import Path
import shutil
import time
from typing import Any, Dict, List, Sequence


SCRIPT_DIR = Path(__file__).resolve().parent

SUITE_CONFIGS: Dict[str, Dict[str, Any]] = {
    "dri": {
        "input": SCRIPT_DIR / "dri.jsonl",
        "output": SCRIPT_DIR / ".." / "dri.evalset.json",
        "session_app_name": "CanadaDRIPlanner",
    },
    "mfp_macro": {
        "input": SCRIPT_DIR / "mfp.jsonl",
        "output": SCRIPT_DIR / ".." / "mfp.evalset.json",
        "session_app_name": "MFPNutritionPlanner",
    },
}


def build_eval_case_name(row: Dict[str, Any], index: int) -> str:
    sample_index = row.get("sample_index")
    if isinstance(sample_index, int):
        return f"sample_{sample_index:05d}_{index:05d}"
    return f"sample_{index:05d}"


def _derive_eval_set_id(output_path: Path) -> str:
    name = output_path.name
    if name.endswith(".evalset.json"):
        return name[: -len(".evalset.json")]
    if name.endswith(".json"):
        return name[: -len(".json")]
    return output_path.stem


def _detect_suite_name(path: Path) -> str:
    name = path.name.lower()
    if "mfp_macro" in name or name.startswith("mfp.") or name == "mfp.jsonl":
        return "mfp_macro"
    if name.startswith("dri.") or name == "dri.jsonl":
        return "dri"
    raise ValueError(
        "Could not determine eval suite from filename. Expected one containing "
        "'dri' or 'mfp'/'mfp_macro'."
    )


def _agent_evalset_paths(suite_name: str, filename: str) -> Sequence[Path]:
    code_root = SCRIPT_DIR.parent
    if suite_name == "mfp_macro":
        return (
            code_root / "BaselineMFPNutritionPlanner" / filename,
            code_root / "OptimizerMFPNutritionPlanner" / filename,
        )
    if suite_name == "dri":
        return (
            code_root / "BaselineCanadaDRIPlanner" / filename,
            code_root / "OptimizerCanadaDRIPlanner" / filename,
        )
    raise ValueError(f"Unsupported eval suite: {suite_name}")


def _desired_app_name_for_path(path: Path, fallback: str) -> str:
    parent_name = path.parent.name
    if parent_name in {"BaselineCanadaDRIPlanner", "BaselineMFPNutritionPlanner"}:
        return "LLMNutritionPlanner"
    if parent_name == "OptimizerCanadaDRIPlanner":
        return "CanadaDRIPlanner"
    if parent_name == "OptimizerMFPNutritionPlanner":
        return "MFPNutritionPlanner"
    return fallback


def _rewrite_session_app_name(evalset_path: Path, app_name: str) -> None:
    with evalset_path.open("r", encoding="utf-8") as handle:
        payload = json.load(handle)

    for eval_case in payload.get("eval_cases", []):
        session_input = eval_case.get("session_input")
        if not isinstance(session_input, dict):
            session_input = {}
            eval_case["session_input"] = session_input
        session_input["app_name"] = app_name

    with evalset_path.open("w", encoding="utf-8") as handle:
        json.dump(payload, handle, indent=2)


def _build_job(
    input_path: Path,
    output_path: Path | None,
    session_app_name: str | None,
) -> Dict[str, Any]:
    suite_name = _detect_suite_name(input_path)
    suite_config = SUITE_CONFIGS[suite_name]
    return {
        "suite_name": suite_name,
        "input_path": input_path,
        "output_path": output_path or Path(suite_config["output"]),
        "session_app_name": session_app_name or str(suite_config["session_app_name"]),
    }


def _default_jobs() -> List[Dict[str, Any]]:
    return [
        _build_job(
            input_path=Path(config["input"]),
            output_path=Path(config["output"]),
            session_app_name=str(config["session_app_name"]),
        )
        for config in SUITE_CONFIGS.values()
    ]


def _write_evalset_to_destinations(
    output_path: Path,
    suite_name: str,
    session_app_name: str,
) -> List[Path]:
    written_paths = [output_path]
    seen_paths = {output_path.resolve()}

    for target_path in _agent_evalset_paths(suite_name, output_path.name):
        resolved_target = target_path.resolve()
        if resolved_target in seen_paths:
            continue
        target_path.parent.mkdir(parents=True, exist_ok=True)
        shutil.copyfile(output_path, target_path)
        written_paths.append(target_path)
        seen_paths.add(resolved_target)

    for path in written_paths:
        desired_app_name = _desired_app_name_for_path(path, session_app_name)
        _rewrite_session_app_name(path, desired_app_name)

    return written_paths


def convert_jsonl_to_evalset(
    input_path: Path,
    output_path: Path,
    query_field: str,
    reference_field: str,
    eval_set_id: str,
    session_app_name: str,
    session_user_id: str,
) -> int:
    eval_cases: List[Dict[str, Any]] = []
    base_timestamp = time.time()

    with input_path.open("r", encoding="utf-8") as handle:
        for idx, line in enumerate(handle, start=1):
            line = line.strip()
            if not line:
                continue

            row = json.loads(line)
            query = row.get(query_field)
            if not isinstance(query, str) or not query.strip():
                continue

            reference = row.get(reference_field, "")
            if not isinstance(reference, str):
                reference = ""

            case_name = build_eval_case_name(row, idx)
            case_timestamp = base_timestamp + (len(eval_cases) * 0.001)
            invocation_id = f"{case_name}_invocation_00001"
            eval_cases.append(
                {
                    "eval_id": case_name,
                    "conversation": [
                        {
                            "invocation_id": invocation_id,
                            "user_content": {
                                "role": "user",
                                "parts": [{"text": query}],
                            },
                            "final_response": {
                                "role": "model",
                                "parts": [{"text": reference}],
                            },
                            "intermediate_data": {
                                "tool_uses": [],
                                "tool_responses": [],
                                "intermediate_responses": [],
                            },
                            "creation_timestamp": case_timestamp,
                        }
                    ],
                    "session_input": {
                        "app_name": session_app_name,
                        "user_id": session_user_id,
                        "state": {},
                    },
                    "creation_timestamp": case_timestamp,
                }
            )

    evalset: Dict[str, Any] = {
        "eval_set_id": eval_set_id,
        "name": eval_set_id,
        "eval_cases": eval_cases,
        "creation_timestamp": base_timestamp,
    }

    output_path.parent.mkdir(parents=True, exist_ok=True)
    with output_path.open("w", encoding="utf-8") as handle:
        json.dump(evalset, handle, indent=2)

    return len(eval_cases)


def _convert_job(
    *,
    suite_name: str,
    input_path: Path,
    output_path: Path,
    query_field: str,
    reference_field: str,
    eval_set_id: str | None,
    session_app_name: str,
    session_user_id: str,
) -> Dict[str, Any]:
    resolved_eval_set_id = eval_set_id or _derive_eval_set_id(output_path)
    count = convert_jsonl_to_evalset(
        input_path=input_path,
        output_path=output_path,
        query_field=query_field,
        reference_field=reference_field,
        eval_set_id=resolved_eval_set_id,
        session_app_name=session_app_name,
        session_user_id=session_user_id,
    )
    written_paths = _write_evalset_to_destinations(
        output_path=output_path,
        suite_name=suite_name,
        session_app_name=session_app_name,
    )
    return {
        "suite_name": suite_name,
        "count": count,
        "session_app_name": session_app_name,
        "written_paths": written_paths,
    }


def _print_results(results: Sequence[Dict[str, Any]]) -> None:
    for result in results:
        print(f"Wrote {result['count']} eval cases for {result['suite_name']} to:")
        for path in result["written_paths"]:
            app_name = _desired_app_name_for_path(path, result["session_app_name"])
            print(f"- {path.resolve()} (app_name={app_name})")


def main() -> None:
    parser = argparse.ArgumentParser(
        description=(
            "Convert one or both suite JSONL files into ADK eval set JSON format. "
            "When run without --input, both default suites are generated."
        )
    )
    parser.add_argument(
        "--input",
        default=None,
        help=(
            "Optional input JSONL file path. If omitted, the script generates both "
            "dri and mfp evalsets."
        ),
    )
    parser.add_argument(
        "--output",
        default=None,
        help=(
            "Optional output eval set JSON file path. Only valid together with a "
            "single --input."
        ),
    )
    parser.add_argument(
        "--query-field",
        default="profile_sentence",
        help="JSON field to use as user query.",
    )
    parser.add_argument(
        "--reference-field",
        default="reference",
        help="Optional JSON field to use as expected response.",
    )
    parser.add_argument(
        "--eval-set-id",
        default=None,
        help="Eval set identifier for the output. Defaults to output filename stem.",
    )
    parser.add_argument(
        "--session-app-name",
        default=None,
        help="Optional app_name for the base eval file when generating a single suite.",
    )
    parser.add_argument(
        "--session-user-id",
        default="eval_user",
        help="Session user_id injected into each eval case session_input.",
    )
    args = parser.parse_args()

    if args.output and not args.input:
        parser.error("--output requires --input.")
    if args.eval_set_id and not args.input:
        parser.error("--eval-set-id requires --input.")

    if args.input:
        jobs = [
            _build_job(
                input_path=Path(args.input),
                output_path=Path(args.output) if args.output else None,
                session_app_name=args.session_app_name,
            )
        ]
    else:
        jobs = _default_jobs()

    results: List[Dict[str, Any]] = []
    for job in jobs:
        results.append(
            _convert_job(
                suite_name=job["suite_name"],
                input_path=job["input_path"],
                output_path=job["output_path"],
                query_field=args.query_field,
                reference_field=args.reference_field,
                eval_set_id=args.eval_set_id,
                session_app_name=job["session_app_name"],
                session_user_id=args.session_user_id,
            )
        )

    _print_results(results)


if __name__ == "__main__":
    main()
