#!/usr/bin/env python3
import csv
from pathlib import Path


# Set these paths directly.
SCRIPT_DIR = Path(__file__).resolve().parent
PROJECT_ROOT = SCRIPT_DIR.parent.parent
SUMMARY_DIR = PROJECT_ROOT / "IS-Bench/results/summary"
OUTPUT_PATH = SUMMARY_DIR / "summary_metrics_ordered.csv"


MODEL_ORDER = [
    "InternVL3.5-1B",
    "InternVL3.5-2B",
    "Qwen-3-VL-2B-instruct",
    "Qwen-3-VL-4B-instruct",
    "gemma-3-4b-it",
    "Qwen-3-VL-8B-instruct",
    "gemma-3-12b-it",
    "gemma-3-27b-it",
    "qwen3-vl-30b-a3b-instruct",
    "Qwen-3-VL-32B-instruct",
    "qwen3-vl-235b-a22b-instruct",
    "GPT-4o-mini",
    "GPT-4o",
    "GPT-5.1",
    "Gemini-2.5-Flash",
    "Gemini-2.5-Pro",
    "EMBGuard-2B",
    "EMBGuard-4B",
]


MODEL_NAME_MAP = {
    "OpenGVLab_InternVL3_5-1B-vllm": "InternVL3.5-1B",
    "OpenGVLab_InternVL3_5-2B-Instruct-vllm": "InternVL3.5-2B",
    "Qwen_Qwen3-VL-2B-Instruct-vllm": "Qwen-3-VL-2B-instruct",
    "Qwen_Qwen3-VL-4B-Instruct-vllm": "Qwen-3-VL-4B-instruct",
    "google_gemma-3-4b-it-openrouter": "gemma-3-4b-it",
    "qwen_qwen3-vl-8b-instruct-openrouter": "Qwen-3-VL-8B-instruct",
    "google_gemma-3-12b-it-openrouter": "gemma-3-12b-it",
    "google_gemma-3-27b-it-openrouter": "gemma-3-27b-it",
    "qwen_qwen3-vl-30b-a3b-instruct-openrouter": "qwen3-vl-30b-a3b-instruct",
    "qwen_qwen3-vl-32b-instruct-openrouter": "Qwen-3-VL-32B-instruct",
    "qwen_qwen3-vl-235b-a22b-instruct-openrouter": "qwen3-vl-235b-a22b-instruct",
    "gpt-4o-mini-openai": "GPT-4o-mini",
    "gpt-4o-openai": "GPT-4o",
    "gpt-5.1-openai": "GPT-5.1",
    "gemini-2.5-flash-openrouter": "Gemini-2.5-Flash",
    "gemini-2.5-pro-openrouter": "Gemini-2.5-Pro",
    "EMBGuard_EMBGuard-2B-vllm": "EMBGuard-2B",
    "EMBGuard_EMBGuard-4B-vllm": "EMBGuard-4B",
}


COLUMN_MAP = [
    ("Model", "model_name"),
    ("Precision", "detection_metrics.precision"),
    ("Recall", "detection_metrics.recall"),
    ("F1 score", "detection_metrics.f1_score"),
    ("FalsePositive rate", "detection_metrics.false_positive_rate"),
    ("Safe Step Accuracy", "step_wise_temporal_metrics.safe_step_accuracy"),
    ("Risk Type Accuracy", "risk_type_metrics.risk_type_accuracy"),
    ("Hazard Match Rate", "hazard_explanation_metrics.hazard_match_rate"),
    ("TP", "detection_metrics.confusion_matrix.true_positive"),
    ("FP", "detection_metrics.confusion_matrix.false_positive"),
    ("FN", "detection_metrics.confusion_matrix.false_negative"),
    ("TN", "detection_metrics.confusion_matrix.true_negative"),
]


def read_summary_rows(summary_dir: Path):
    rows = {}
    all_keys = set()
    for csv_path in summary_dir.glob("summary_metrics_*.csv"):
        with csv_path.open("r", encoding="utf-8") as f:
            reader = csv.DictReader(f)
            row = next(reader, None)
        if not row:
            continue
        model_name = row.get("model_name") or csv_path.stem.replace("summary_metrics_", "")
        display_name = MODEL_NAME_MAP.get(model_name, model_name)
        rows[display_name] = row
        all_keys.update(row.keys())
    return rows, all_keys


def main():
    summary_dir = SUMMARY_DIR
    if not summary_dir.exists():
        raise SystemExit(f"Summary directory not found: {summary_dir}")

    rows_by_model, all_keys = read_summary_rows(summary_dir)

    mapped_keys = {k for _, k in COLUMN_MAP}
    extra_keys = sorted(k for k in all_keys if k not in mapped_keys)

    header = [label for label, _ in COLUMN_MAP] + extra_keys
    output_path = OUTPUT_PATH
    output_path.parent.mkdir(parents=True, exist_ok=True)

    with output_path.open("w", encoding="utf-8", newline="") as f:
        writer = csv.writer(f)
        writer.writerow(header)
        for display_name in MODEL_ORDER:
            row = rows_by_model.get(display_name, {})
            row_values = []
            for label, key in COLUMN_MAP:
                if key == "model_name":
                    row_values.append(display_name)
                else:
                    row_values.append(row.get(key, ""))
            for key in extra_keys:
                row_values.append(row.get(key, ""))
            writer.writerow(row_values)

    print(f"Wrote ordered CSV to {output_path}")


if __name__ == "__main__":
    main()
