import os
import sys
import yaml
import argparse
import logging
import pandas as pd
from datetime import datetime

project_root = os.path.abspath(os.path.join(os.path.dirname(__file__), ".."))
if project_root not in sys.path:
    sys.path.insert(0, project_root)

from generators.vanilla_endowment_generator import EndowmentGenerator
from modules.token_tracker import MultiAxisTokenTracker


def load_config(path: str) -> dict:
    with open(path, "r") as f:
        return yaml.safe_load(f)


def generate_vanilla_endowments(config_path: str):
    # === Load config
    cfg = load_config(config_path)

    meta = cfg.get("metadata", {})
    name = meta.get("name", "vanilla_generation")

    # ============================================================
    #          OUTPUT DIRECTORY TAKEN FROM YAML
    # ============================================================
    yaml_output = cfg.get("output_dir")
    if yaml_output is None or str(yaml_output).strip() == "":
        # fallback if not provided
        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        output_dir = os.path.join("outputs", f"{name}_{timestamp}")
    else:
        output_dir = yaml_output

    os.makedirs(output_dir, exist_ok=True)
    print(f"[INFO] Using output_dir = {output_dir}")

    # === Logger
    log_path = os.path.join(output_dir, "vanilla_generation.log")
    logger = logging.getLogger("vanilla_endowment_logger")
    logger.setLevel(logging.INFO)
    logger.handlers = []

    formatter = logging.Formatter("%(asctime)s [%(levelname)s] %(message)s")

    fh = logging.FileHandler(log_path)
    fh.setFormatter(formatter)
    logger.addHandler(fh)

    ch = logging.StreamHandler(sys.stdout)
    ch.setFormatter(formatter)
    logger.addHandler(ch)

    logger.info(f"[Vanilla] Output directory: {output_dir}")

    # === Token tracker
    tracker = MultiAxisTokenTracker()

    # === Generator initialization
    gen_cfg = cfg.get("endowment_generator", {})
    generator = EndowmentGenerator(
        backend_type=gen_cfg.get("backend", "openai"),
        model_name=gen_cfg.get("model_name", "gpt-4o-mini"),
        temperature=gen_cfg.get("temperature", 0.9),
        max_tokens=gen_cfg.get("max_tokens", 1024),
        batch_size=gen_cfg.get("batch_size", 10),
        delay=gen_cfg.get("delay", 0.5),
        retry_failed=gen_cfg.get("retry_failed", True),
        clear_after_run=False,
        token_tracker=tracker,
        verbose=True,
    )

    # === Generate endowments
    n = gen_cfg.get("n_endowments", 1000)
    topic = gen_cfg.get("topic_description")

    logger.info(f"[Vanilla] Generating {n} endowments...")
    endowments = generator.generate(n, topic_description=topic)

    # === Save JSONL
    jsonl_name = f"vanilla_{n}.jsonl"
    jsonl_path = os.path.join(output_dir, jsonl_name)
    generator.save(jsonl_path)
    logger.info(f"[Vanilla] Saved JSONL to {jsonl_path}")

    # === Save CSV with automatic naming: vanilla_{n}.csv
    csv_name = f"vanilla_{n}.csv"
    csv_path = os.path.join(output_dir, csv_name)

    df = pd.DataFrame(endowments)
    df.to_csv(csv_path, index=False)

    logger.info(f"[Vanilla] Saved endowments CSV to {csv_path}")

    # === Save token usage
    tracker_csv = os.path.join(output_dir, "token_usage.csv")
    tracker.save(tracker_csv)
    with open(os.path.join(output_dir, "token_report.md"), "w") as f:
        f.write(tracker.report())

    logger.info(f"[Vanilla] Token usage saved to {tracker_csv}")

    logger.info("[Vanilla] Generation complete.")

    return output_dir, csv_path


if __name__ == "__main__":
    parser = argparse.ArgumentParser(description="Generate vanilla endowments only (no regression)")
    parser.add_argument("--config", type=str, required=True)
    args = parser.parse_args()

    generate_vanilla_endowments(args.config)