#!/usr/bin/env python3
"""
Generate Videos from Evaluation Output Frames

This utility traverses nested evaluation directory structures to locate "leaf" 
folders containing extracted visualization frames. Each isolated sequence is 
compiled into a continuous MP4 format for qualitative review.
"""

from __future__ import annotations

import argparse
import os
import re
import sys
from pathlib import Path
from typing import List, Set

# Base configuration paths and parameters
SCRIPT_DIR = Path(__file__).resolve().parent
DEFAULT_INPUT_ROOT = SCRIPT_DIR / "Outputs"
DEFAULT_OUTPUT_ROOT = SCRIPT_DIR / "VideoOutputs"
DEFAULT_FPS = 30.0
DEFAULT_CODEC = "mp4v"
DEFAULT_IMAGE_EXTS = {".png", ".jpg", ".jpeg", ".bmp", ".tif", ".tiff", ".webp"}

# Regex compiler to split filenames for natural sequence ordering
_NATURAL_RE = re.compile(r"(\d+)")

def natural_sort_key(p: Path) -> list:
    """
    Constructs a sorting key ensuring numerical consistency.
    Standard alphabetic sort places '10' before '2'. Splitting integers 
    forces string-to-number type promotion, making '2' precede '10'.
    """
    parts = _NATURAL_RE.split(p.name.lower())
    return [int(tok) if tok.isdigit() else tok for tok in parts]

def collect_leaf_dirs(root: Path, exts: Set[str]) -> List[Path]:
    """
    Locate terminal subdirectories that actually house output frames.
    It does so by checking 'dirnames'—an empty directory array indicates a leaf.
    This guarantees frames are collated independently for distinct scenes.
    """
    leaves: List[Path] = []
    for dirpath, dirnames, filenames in os.walk(root):
        if not dirnames:
            if any(Path(f).suffix.lower() in exts for f in filenames):
                leaves.append(Path(dirpath))
    leaves.sort()
    return leaves

def sorted_images(directory: Path, exts: Set[str]) -> List[Path]:
    """
    Aggregates image frames from a directory in correct chronological sequence
    by enforcing natural sort via `natural_sort_key`.
    """
    imgs = [
        p for p in directory.iterdir()
        if p.is_file() and p.suffix.lower() in exts
    ]
    imgs.sort(key=natural_sort_key)
    return imgs

def relative_or_abs(path: Path, root: Path) -> Path:
    """
    Returns a brief, relative folder path when possible to keep CLI stdout
    lean and highly readable instead of printing massive string literals.
    """
    try:
        return path.relative_to(root)
    except ValueError:
        return path

def load_bgr_uint8(path: Path):
    """
    Reads incoming frames safely with OpenCV and strictly forces them into
    a uniform format (BGR color order, 8-bit unsigned integer).
    Missing files or mismatched formats trigger errors in OpenCV's MP4 encoder,
    so homogenization logic buffers those problems here.
    """
    import cv2
    import numpy as np

    frame = cv2.imread(str(path), cv2.IMREAD_UNCHANGED)
    if frame is None:
        raise ValueError(f"Cannot read image: {path}")

    # Explicit format casting ensures non-3-channel images don't derail encoding.
    if frame.ndim == 2:
        frame = cv2.cvtColor(frame, cv2.COLOR_GRAY2BGR)
    elif frame.ndim == 3 and frame.shape[2] == 4:
        frame = cv2.cvtColor(frame, cv2.COLOR_BGRA2BGR)

    # Cast floats spanning irregular formats into a bounded [0, 255] discrete spectrum
    if frame.dtype != np.uint8:
        if np.issubdtype(frame.dtype, np.floating):
            frame = np.nan_to_num(frame, nan=0.0, posinf=255.0, neginf=0.0)
        frame = np.clip(frame, 0, 255).astype(np.uint8)

    return frame

def write_video(frames: List[Path], output_path: Path, fps: float, codec: str) -> None:
    """
    Pulls a chronological list of frames and continuously appends them 
    into a structured video buffer container. Resolves shape disparities
    on-the-fly via resolution resizing.
    """
    import cv2

    first = load_bgr_uint8(frames[0])
    h, w = first.shape[:2]

    # Preemptively construct path tree for targets like VideoOutputs/DepthAnythingV2/...
    output_path.parent.mkdir(parents=True, exist_ok=True)
    fourcc = cv2.VideoWriter_fourcc(*codec)
    writer = cv2.VideoWriter(str(output_path), fourcc, fps, (w, h))
    if not writer.isOpened():
        raise RuntimeError(f"VideoWriter failed for {output_path} (codec={codec})")

    try:
        writer.write(first)
        # Step sequentially through sequence injecting each matrix frame to writer
        for fp in frames[1:]:
            img = load_bgr_uint8(fp)
            # Resize image to dimensions initialized dynamically by the first frame
            if (img.shape[0], img.shape[1]) != (h, w):
                img = cv2.resize(img, (w, h), interpolation=cv2.INTER_AREA)
            writer.write(img)
    finally:
        # Closing guarantees valid MP4 header writing
        writer.release()

def parse_args() -> argparse.Namespace:
    """Standard options handler supporting execution variants."""
    p = argparse.ArgumentParser(
        description=__doc__,
        formatter_class=argparse.RawDescriptionHelpFormatter,
    )
    p.add_argument("--input-root", type=Path, default=DEFAULT_INPUT_ROOT,
                   help=f"Root with image folders.  Default: {DEFAULT_INPUT_ROOT}")
    p.add_argument("--output-root", type=Path, default=DEFAULT_OUTPUT_ROOT,
                   help=f"Root for output videos.  Default: {DEFAULT_OUTPUT_ROOT}")
    p.add_argument("--fps", type=float, default=DEFAULT_FPS,
                   help=f"Frames per second.  Default: {DEFAULT_FPS}")
    p.add_argument("--codec", type=str, default=DEFAULT_CODEC,
                   help=f"FourCC codec string.  Default: {DEFAULT_CODEC}")
    p.add_argument("--overwrite", action="store_true",
                   help="Re-create videos that already exist.")
    p.add_argument("--dry-run", action="store_true",
                   help="List planned videos without writing anything.")
    p.add_argument("--min-frames", type=int, default=2,
                   help="Skip folders with fewer frames.  Default: 2")
    return p.parse_args()

def main() -> int:
    args = parse_args()

    # Precautionary module probe
    if not args.dry_run:
        try:
            import cv2   # noqa: F401
            import numpy  # noqa: F401
        except ModuleNotFoundError as e:
            print(f"[ERROR] Missing Python package: {e.name}")
            return 1

    input_root = args.input_root.resolve()
    output_root = args.output_root.resolve()

    if not input_root.is_dir():
        print(f"[ERROR] Input root not found: {input_root}")
        return 1

    exts = DEFAULT_IMAGE_EXTS
    leaf_dirs = collect_leaf_dirs(input_root, exts)

    print(f"Input root  : {input_root}")
    print(f"Output root : {output_root}")
    print(f"Leaf folders: {len(leaf_dirs)}")
    print(f"FPS / Codec : {args.fps} / {args.codec}")
    print()

    created, skipped_exist, skipped_short, failed = 0, 0, 0, 0

    # Iteratively evaluate folders and compile encoded sequences
    for leaf in leaf_dirs:
        frames = sorted_images(leaf, exts)

        # Truncated fragments break visual evaluation; discard sequences with < minimum threshold
        if len(frames) < args.min_frames:
            skipped_short += 1
            print(f"  [SKIP-SHORT] {len(frames)} frames: {leaf.relative_to(input_root)}")
            continue

        rel = leaf.relative_to(input_root)
        video_path = (output_root / rel).with_suffix(".mp4")

        # Ignore if output path is historically populated, ignoring overwrite flag
        if video_path.exists() and not args.overwrite:
            skipped_exist += 1
            print(f"  [EXISTS] {relative_or_abs(video_path, output_root)}")
            continue

        print(f"  [VIDEO] {rel}  ({len(frames)} frames) -> {relative_or_abs(video_path, output_root)}")

        if args.dry_run:
            created += 1
            continue

        try:
            write_video(frames, video_path, args.fps, args.codec)
            created += 1
        except Exception as exc:
            failed += 1
            print(f"  [FAIL]  {relative_or_abs(video_path, output_root)}: {exc}")

    print("\n" + "=" * 50)
    print(f"  Videos created   : {created}")
    print(f"  Skipped (exist)  : {skipped_exist}")
    print(f"  Skipped (short)  : {skipped_short}")
    print(f"  Failed           : {failed}")
    print("=" * 50)

    return 1 if failed else 0

if __name__ == "__main__":
    sys.exit(main())
