


import os
os.environ.setdefault("MPLCONFIGDIR", "/tmp/matplotlib")

import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from pathlib import Path


def _resolve_paths():
    base_dir = Path(__file__).resolve().parent if "__file__" in globals() else Path.cwd()
    root_dir = base_dir
    while root_dir != root_dir.parent and not (root_dir / "final_results").is_dir():
        root_dir = root_dir.parent
    drawing_dir = base_dir
    results_dir = root_dir / "final_results"
    rank_dir = results_dir / "ranking" / "nlp_cv"
    fig_dir = results_dir / "figures"
    fig_dir.mkdir(parents=True, exist_ok=True)
    return root_dir, drawing_dir, results_dir, rank_dir, fig_dir


PROJECT_DIR, DRAWING_DIR, RESULTS_DIR, RANK_DIR, FIG_DIR = _resolve_paths()


def Draw_time_train(file_path, output_path):
    data = pd.read_csv(file_path)
    if data.empty:
        print(f"The file {file_path} is empty or does not contain valid data.")
        return

    time_train_col = "Time Train" if "Time Train" in data.columns else "Time train"
    if time_train_col not in data.columns:
        raise ValueError(f"Missing column '{time_train_col}' in {file_path}")

    relevant_data = data[["Model", time_train_col]].copy()
    relevant_data = relevant_data.rename(columns={time_train_col: "Time Train"})

    group_mapping = {
        : "Traditional", "CBLOF": "Traditional", "KNN": "Traditional",
        : "Traditional", "HBOS": "Traditional", "PCA": "Traditional",
        : "Traditional", "COF": "Traditional", "LODA": "Traditional",
        : "Traditional", "COPOD": "Traditional", "IForest": "Traditional",
        : "Traditional", "PMKFN": "Traditional", "KNFST": "Traditional",

        : "Deep Learning", "AE1SVM": "Deep Learning",
        : "Deep Learning", "LUNAR": "Deep Learning", "ALAD": "Deep Learning",
        : "Deep Learning", "NeuTraLAD": "Deep Learning", "DRLAD": "Deep Learning",
        : "Deep Learning", "DIF": "Deep Learning", "AnoGAN": "Deep Learning",
        : "Deep Learning", "SO_GAAL": "Deep Learning",

        : "Proposed"
    }
    relevant_data["Group"] = relevant_data["Model"].map(group_mapping)

    group_order = ["Traditional", "Deep Learning", "Proposed"]
    model_order = []
    for group in group_order:
        models = relevant_data[relevant_data["Group"] == group]["Model"].unique()
        model_order.extend(models)

    relevant_data["Model"] = pd.Categorical(relevant_data["Model"], categories=model_order, ordered=True)

    group_colors = {
        : "#ADD8E6",
        : "#98FB98",
        : "#FFB6C1"
    }
    traditional_models = relevant_data[relevant_data["Group"] == "Traditional"]["Model"].unique()
    deep_models = relevant_data[relevant_data["Group"] == "Deep Learning"]["Model"].unique()

    palette = {}
    palette.update({model: sns.color_palette("Blues", len(traditional_models))[i]
                    for i, model in enumerate(traditional_models)})
    palette.update({model: sns.color_palette("Greens", len(deep_models))[i]
                    for i, model in enumerate(deep_models)})
    palette["DVM-AD"] = "#FFB6C1"

    plt.figure(figsize=(14, 6))
    ax = sns.boxplot(data=relevant_data, x="Model", y="Time Train", hue="Model", palette=palette, dodge=False)
    if ax.get_legend() is not None:
        ax.get_legend().remove()

    current_x = -0.5
    for group in group_order:
        count = relevant_data[relevant_data["Group"] == group]["Model"].nunique()
        plt.axvspan(current_x, current_x + count, color=group_colors[group], alpha=0.3)
        current_x += count

    plt.yscale('log')
    plt.ylabel("Training Time (log seconds)", fontsize=12)
    plt.xlabel("Models", fontsize=12)
    plt.xticks(rotation=45, ha="right")
    plt.tight_layout()

    os.makedirs(os.path.dirname(output_path), exist_ok=True)
    plt.savefig(output_path, dpi=300)
    plt.close()

    print(f"Plot saved to {output_path}")


def Draw_time_test(file_path, output_path):
    data = pd.read_csv(file_path)
    if data.empty:
        print(f"The file {file_path} is empty or does not contain valid data.")
        return

    time_test_col = "Time Test" if "Time Test" in data.columns else "Time test"
    if time_test_col not in data.columns:
        raise ValueError(f"Missing column '{time_test_col}' in {file_path}")

    relevant_data = data[["Model", time_test_col]].copy()
    relevant_data = relevant_data.rename(columns={time_test_col: "Time Test"})

    group_mapping = {
        : "Traditional", "CBLOF": "Traditional", "KNN": "Traditional",
        : "Traditional", "HBOS": "Traditional", "PCA": "Traditional",
        : "Traditional", "COF": "Traditional", "LODA": "Traditional",
        : "Traditional", "COPOD": "Traditional", "IForest": "Traditional",
        : "Traditional", "PMKFN": "Traditional", "KNFST": "Traditional",

        : "Deep Learning", "AE1SVM": "Deep Learning",
        : "Deep Learning", "LUNAR": "Deep Learning", "ALAD": "Deep Learning",
        : "Deep Learning", "NeuTraLAD": "Deep Learning", "DRLAD": "Deep Learning",
        : "Deep Learning", "DIF": "Deep Learning", "AnoGAN": "Deep Learning",
        : "Deep Learning", "SO_GAAL": "Deep Learning",

        : "Proposed"
    }
    relevant_data["Group"] = relevant_data["Model"].map(group_mapping)

    group_order = ["Traditional", "Deep Learning", "Proposed"]
    model_order = []
    for group in group_order:
        models = relevant_data[relevant_data["Group"] == group]["Model"].unique()
        model_order.extend(models)

    relevant_data["Model"] = pd.Categorical(relevant_data["Model"], categories=model_order, ordered=True)

    group_colors = {
        : "#ADD8E6",
        : "#98FB98",
        : "#FFB6C1"
    }
    traditional_models = relevant_data[relevant_data["Group"] == "Traditional"]["Model"].unique()
    deep_models = relevant_data[relevant_data["Group"] == "Deep Learning"]["Model"].unique()

    palette = {}
    palette.update({model: sns.color_palette("Blues", len(traditional_models))[i]
                    for i, model in enumerate(traditional_models)})
    palette.update({model: sns.color_palette("Greens", len(deep_models))[i]
                    for i, model in enumerate(deep_models)})
    palette["DVM-AD"] = "#FFB6C1"

    plt.figure(figsize=(14, 6))
    ax = sns.boxplot(data=relevant_data, x="Model", y="Time Test", hue="Model", palette=palette, dodge=False)
    if ax.get_legend() is not None:
        ax.get_legend().remove()

    current_x = -0.5
    for group in group_order:
        count = relevant_data[relevant_data["Group"] == group]["Model"].nunique()
        plt.axvspan(current_x, current_x + count, color=group_colors[group], alpha=0.3)
        current_x += count

    plt.yscale('log')
    plt.ylabel("Testing Time (log seconds)", fontsize=12)
    plt.xlabel("Models", fontsize=12)
    plt.xticks(rotation=45, ha="right")
    plt.tight_layout()

    os.makedirs(os.path.dirname(output_path), exist_ok=True)
    plt.savefig(output_path, dpi=300)
    plt.close()

    print(f"Plot saved to {output_path}")



RANK_FILES = {
    : "dvmad_result_nlp_cv_10_datasets_rank.csv",
    : "dvmad_result_tabular_47_datasets_rank.csv",
}

for label, filename in RANK_FILES.items():
    file_path = RANK_DIR / filename
    if not file_path.exists():
        print(f"Missing file: {file_path}")
        continue

    Draw_time_train(file_path, FIG_DIR / f"Time_train_{label}.png")
    Draw_time_test(file_path, FIG_DIR / f"Time_test_{label}.png")
