import os
import random
import sys
sys.path.append(os.getcwd())
import argparse
from collections import OrderedDict

import matplotlib.pyplot as plt
import numpy as np
import json
from scipy.interpolate import make_interp_spline
import seaborn as sns
from matplotlib.ticker import StrMethodFormatter
from config import MODELS_TEST_STANDARD

from matplotlib.ticker import StrMethodFormatter
from matplotlib import rcParams, rc
rcParams['pdf.fonttype'] = 42
rcParams['ps.fonttype'] = 42
rcParams['xtick.direction'] = 'out'
rcParams['ytick.direction'] = 'out'
rc('pdf', fonttype=42)

linestyle_dict = OrderedDict(
    [('solid',               (0, ())),
     ('loosely dotted',      (0, (1, 10))),
     ('dotted',              (0, (1, 5))),
     ('densely dotted',      (0, (1, 1))),

     ('loosely dashed',      (0, (5, 10))),
     ('dashed',              (0, (5, 5))),
     ('densely dashed',      (0, (5, 1))),

     ('loosely dashdotted',  (0, (3, 10, 1, 10))),
     ("dashdot","dashdot"),
     ('dashdotted',          (0, (3, 5, 1, 5))),
     ('densely dashdotted',  (0, (3, 1, 1, 1))),

     ('loosely dashdotdotted', (0, (3, 10, 1, 10, 1, 10))),
     ('dashdotdotted',         (0, (3, 5, 1, 5, 1, 5))),
     ('densely dashdotdotted', (0, (3, 1, 1, 1, 1, 1)))])

def read_json_data(json_path):
    # data_key can be query_success_rate_dict, query_threshold_success_rate_dict, success_rate_to_avg_query
    print("begin read {}".format(json_path))
    with open(json_path, "r") as file_obj:
        data_txt = file_obj.read()
        data_json = json.loads(data_txt)
        distortion_dict = data_json["distortion"]
        surrogate_archs = []
        surrogate_defense_models = []
        surrogate_defense_norms = []
        surrogate_defense_eps = []
        if "surrogate_arch" in data_json["args"] and data_json["args"]["surrogate_arch"] is not None:
            surrogate_archs.append(data_json["args"]["surrogate_arch"])
        elif "surrogate_archs" in data_json["args"] and data_json["args"]["surrogate_archs"] is not None:
            surrogate_archs.extend(data_json["args"]["surrogate_archs"])
        if "surrogate_defense_models" in data_json["args"] and data_json["args"]["surrogate_defense_models"]:
            surrogate_defense_models.extend(data_json["args"]["surrogate_defense_models"])
            if "surrogate_defense_norms" in data_json["args"]:
                surrogate_defense_norms.extend(data_json["args"]["surrogate_defense_norms"])
            if "surrogate_defense_eps" in data_json["args"]:
                surrogate_defense_eps.extend(data_json["args"]["surrogate_defense_eps"])


    return distortion_dict, surrogate_archs, surrogate_defense_models, surrogate_defense_norms, surrogate_defense_eps

surrogate_arch_name_to_paper = {"inceptionresnetv2":"IncResV2", "xception":"Xception", "resnet50":"ResNet50","convit_base":"ConViT",
                                "jx_vit":"ViT", "resnet-110":"ResNet110", "senet154":"SENet154", "densenet-bc-100-12":"DenseNetBC100",
                                "densenet-bc-L190-k40":"DenseNetBC190", "vgg13_bn":"VGG13", "WRN-28-10":"WRN28"}
def read_all_data(dataset_path_dict, arch, query_budgets, stats="mean_distortion"):
    # dataset_path_dict {("CIFAR-10","l2","untargeted"): "/.../"， }
    data_info = {}
    for (dataset, norm, targeted, method), dir_path in dataset_path_dict.items():
        for file_path in os.listdir(dir_path):
            # 情况1：arch是resnet-50_adv_train，但是文件名是resnet-50_surrogates_resnet-110,densenet-bc-100-12_adv_train_result.json
            # 情况2：arch是resnet50_adv_train_on_ImageNet_l2_3，但是文件名是resnet50_surrogates_resnet50,senet154_adv_train_on_ImageNet_l2_3_result.json或者resnet50(adv_train_l2_3)_surrogates_adv_train_linf_4_div_255(resnet50),adv_train_linf_8_div_255(resnet50)_result.json
            if file_path.startswith(arch) or file_path.startswith(arch_translation[arch]) and file_path.endswith(".json"):
                file_path = dir_path + "/" + file_path
                distortion_dict, surrogate_archs, surrogate_defense_models, surrogate_defense_norms, surrogate_defense_eps= read_json_data(file_path)
                x = []
                y = []
                for query_budget in query_budgets:
                    if not targeted and method == "BA" and query_budget<1000:
                        print("Skip boundary attack at {} query budgets".format(query_budget))
                        continue
                    distortion_list = []
                    for image_id, query_distortion_dict in distortion_dict.items():
                        query_distortion_dict = {int(float(query)): float(dist) for query, dist in query_distortion_dict.items()}
                        queries = np.array(list(query_distortion_dict.keys()))
                        queries = np.sort(queries)
                        find_index = np.searchsorted(queries, query_budget, side='right') - 1
                        if query_budget < queries[find_index]:
                            print(
                                "query budget is {}, find query is {}, min query is {}, len query_distortion is {}".format(
                                    query_budget, queries[find_index], np.min(queries).item(),
                                    len(query_distortion_dict)))
                            continue
                        distortion_list.append(query_distortion_dict[queries[find_index]])
                    distortion_list = np.array(distortion_list)
                    distortion_list = distortion_list[~np.isnan(distortion_list)]  # 去掉nan的值
                    mean_distortion = np.mean(distortion_list)
                    median_distortion = np.median(distortion_list)
                    x.append(query_budget)
                    if stats == "mean_distortion":
                        y.append(mean_distortion)
                    elif stats == "median_distortion":
                        y.append(median_distortion)
                x = np.array(x)
                y = np.array(y)
                surrogate_archs_string = []
                for idx, surrogate_arch in enumerate(surrogate_archs):
                    if surrogate_defense_models:
                        surrogate_defense_model = surrogate_defense_models[idx]
                        if surrogate_defense_model.startswith("adv_train"):
                            surrogate_defense_model = "AT"
                        elif surrogate_defense_model == "feature_scatter":
                            surrogate_defense_model = "FS"
                        if dataset == "CIFAR-10":
                            surrogate_archs_string.append("{}({})".format(surrogate_defense_model,
                                                                      surrogate_arch_name_to_paper[surrogate_arch]))
                        else:
                            eps = surrogate_defense_eps[idx]
                            if surrogate_defense_eps[idx] == "4_div_255":
                                eps = "\\frac{{4}}{{255}}"
                            elif surrogate_defense_eps[idx] == "8_div_255":
                                eps = "\\frac{{8}}{{255}}"
                            surrogate_archs_string.append("{}({},\epsilon_{{{}}}={})".format(surrogate_defense_model,
                                                                          surrogate_arch_name_to_paper[surrogate_arch],"\ell_\infty" if surrogate_defense_norms[idx] == "linf" else "\ell_2",
                                                                          eps))
                    else:
                        surrogate_archs_string.append(surrogate_arch_name_to_paper[surrogate_arch])
                data_info[(dataset, norm, targeted, method, "&".join(surrogate_archs_string))] = (x,y)
    return data_info




method_name_to_paper = {"tangent_attack":"TA",
                        "ellipsoid_tangent_attack":"G-TA", "GeoDA":"GeoDA",
                        "HSJA":"HSJA", "SignOPT":"Sign-OPT", "SVMOPT":"SVM-OPT",
                         "Evolutionary":"Evolutionary", "SurFree":"SurFree",
                        "TriangleAttack":"Triangle Attack", "PriorSignOPT":"Prior-Sign-OPT",
                        "PriorOPT":"Prior-OPT", "RayS":"RayS"
                        #"QEBA":"QEBA", "CGBA_H":"CGBA-H"
                        }
# method_name_to_paper = {
#                         "PriorOPT":"Prior-OPT","RayS":"RayS"
#                         #"QEBA":"QEBA", "CGBA_H":"CGBA-H"
#                         }
def from_method_to_dir_path(dataset, method, norm, targeted):
    if method == "tangent_attack" or method == "ellipsoid_tangent_attack":
        path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method, dataset=dataset,
                                                                norm=norm, target_str="untargeted" if not targeted else "targeted_increment")
    elif method == "HSJA":
        path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method, dataset=dataset,
                                                                norm=norm,  target_str="untargeted" if not targeted else "targeted_increment")
    elif method == "GeoDA" or method == "RayS" or method == "SurFree" or method == "Evolutionary" or method == "TriangleAttack" or method == "PriorOPT" or method == "PriorSignOPT":
        path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method, dataset=dataset,
                                                                norm=norm, target_str="untargeted" if not targeted else "targeted_increment")
    elif method == "biased_boundary_attack":
        path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method,dataset=dataset,norm=norm, target_str="untargeted" if not targeted else "targeted_increment")
    elif method == "boundary_attack":
        path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method,dataset=dataset,norm=norm, target_str="untargeted" if not targeted else "targeted_increment")
    elif method == "RayS":
        path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method,dataset=dataset,norm=norm, target_str="untargeted" if not targeted else "targeted_increment")
    elif method == "SignOPT":
        if targeted:
            path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method, dataset=dataset, norm=norm,
                                                                   target_str="untargeted" if not targeted else "targeted_increment")
        else:
            path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method,dataset=dataset,norm=norm, target_str="untargeted" if not targeted else "targeted_increment")
    elif method == "SVMOPT":
        if targeted:
            path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method, dataset=dataset, norm=norm,
                                                                   target_str="untargeted" if not targeted else "targeted_increment")
        else:
            path = "{method}_on_defensive_model-{dataset}-{norm}-{target_str}".format(method=method,dataset=dataset,norm=norm, target_str="untargeted" if not targeted else "targeted_increment")
    return path

def get_all_exists_folder(dataset, methods, norm, targeted):
    root_dir = "G:/logs/hard_label_attacks/"
    dataset_path_dict = {}  # dataset_path_dict {("CIFAR-10","l2","untargeted", "NES"): "/.../"， }
    for method in methods:
        file_name = from_method_to_dir_path(dataset, method, norm, targeted)
        file_path = root_dir + file_name
        if os.path.exists(file_path):
            dataset_path_dict[(dataset, norm, targeted, method_name_to_paper[method])] = file_path
        else:
            print("{} does not exist!!!".format(file_path))
    return dataset_path_dict

method_linestyle_mark_dict = {}
def draw_query_distortion_figure(dataset, norm, targeted, arch, fig_type, dump_file_path, xlabel, ylabel):

    # fig_type can be [query_success_rate_dict, query_threshold_success_rate_dict, success_rate_to_avg_query]
    methods = list(method_name_to_paper.keys())
    if targeted:
        methods.remove("TriangleAttack")
        methods.remove("RayS")
    if norm == "l2":
        methods.remove("RayS")
    elif norm == "linf":
        methods.remove("TriangleAttack")
        methods.remove("SurFree")
        methods.remove("Evolutionary")

    dataset_path_dict= get_all_exists_folder(dataset, methods, norm, targeted)
    max_query = 10000
    if dataset == "ImageNet":
        max_query = 20000
    query_budgets = np.arange(1000, max_query+1, 1000)
    data_info = read_all_data(dataset_path_dict, arch, query_budgets, fig_type)  # fig_type can be mean_distortion or median_distortion
    plt.style.use('seaborn-v0_8-whitegrid')
    # from matplotlib import rcParams, rc
    # rcParams['xtick.direction'] = 'out'
    # rcParams['ytick.direction'] = 'out'
    # rcParams['pdf.fonttype'] = 42
    # rcParams['ps.fonttype'] = 42
    # rc('pdf', fonttype=42)

    plt.figure(figsize=(10, 8))
    colors = ['b', 'g', 'c', 'm', 'y', 'k', 'orange', "pink", "brown", "slategrey", "cornflowerblue",
              "greenyellow", "darkgoldenrod", "r", "slategrey", "navy", "darkseagreen", "xkcd:blueberry", "grey",
              "indigo", "olivedrab"]
    markers = ['o', '>', '*', 's', "P", "p", "X", "h", "D", "H", "^", "<", "d", ".", "+", "x", "v", "1", "2", "3", "4"]
    linestyles = ["solid", "dashed", "densely dotted", "dashdotdotted", "densely dashed", "densely dashdotdotted"]


    xtick = np.array([ 0, 1000, 2000, 3000, 4000, 5000, 6000, 7000, 8000, 9000, 10000])
    if max_query == 20000:
        xtick = np.array([ 0, 1000, 2000, 3000, 4000, 5000, 6000, 7000, 8000, 9000, 10000,11000,12000,13000,14000,15000,16000,17000,18000,19000,20000])
    max_y = 0
    min_y= 999
    all_used_colors = set()
    for idx, ((dataset, norm, targeted, method, surrogate_archs), (x,y)) in enumerate(data_info.items()):
        x = np.asarray(x)
        y = np.asarray(y)
        if np.max(y) > max_y:
            max_y = np.max(y)
        if np.min(y) < min_y:
            min_y = np.min(y)
        if surrogate_archs:
            method = method + "$_{\mathrm{"+ surrogate_archs + "}}$"
        # if method not in method_linestyle_mark_dict:
        linestyle = linestyle_dict[linestyles[idx % len(linestyles)]]
        mark = markers[idx]
        if method not in method_linestyle_mark_dict:
            linestyle = linestyle_dict[linestyles[idx % len(linestyles)]]
            mark = markers[idx]
            color = colors[idx]

            # color = colors[idx]

            for_loop_count = 0
            all_use_color = False
            all_use_mark = False
            while color in [tuple_value[2] for tuple_value in
                            method_linestyle_mark_dict.values()]:
                color = random.choice(colors)
                while color in all_used_colors:
                    color = random.choice(colors)

                for_loop_count += 1
                if for_loop_count > 1000:
                    all_use_color = True
                    break
            for_loop_count = 0
            while mark in [tuple_value[1] for tuple_value in
                           method_linestyle_mark_dict.values()]:
                mark = random.choice(markers)
                for_loop_count += 1
                if for_loop_count > 1000:
                    all_use_mark = True
                    break
            if all_use_color or all_use_mark:
                while (mark, color) in [(tuple_value[1], tuple_value[2]) for tuple_value in
                                        method_linestyle_mark_dict.values()]:
                    color = random.choice(colors)
                    while color in all_used_colors:
                        color = random.choice(colors)
                    mark = random.choice(markers)

            method_linestyle_mark_dict[method] = (linestyle, mark, color)
        selected_color = method_linestyle_mark_dict[method][2]
        while selected_color in all_used_colors:
            selected_color = random.choice(colors)
        method_linestyle_mark_dict[method] = (
            method_linestyle_mark_dict[method][0], method_linestyle_mark_dict[method][1], selected_color)
        all_used_colors.add(selected_color)
        plt.plot(x, y, label=method, color=selected_color,
                         linestyle=method_linestyle_mark_dict[method][0], linewidth=1.5,
                         marker=method_linestyle_mark_dict[method][1], markersize=6, alpha=0.8)

    if norm == "linf":
        plt.gca().yaxis.set_major_formatter(StrMethodFormatter('{x:,.2f}'))
    else:
        plt.gca().yaxis.set_major_formatter(StrMethodFormatter('{x:,.0f}'))
    if dataset == "ImageNet":
        plt.xlim(0, max_query + 1000)
    else:
        plt.xlim(0, max_query)
    plt.ylim(0, max_y+0.1)
    plt.gcf().subplots_adjust(bottom=0.15)
    print("max y is {}".format(max_y))

    if dataset == "ImageNet":
        x_ticks = xtick[0::2]
        x_ticks = x_ticks.tolist()
        x_ticks_label = ["0"] + ["{}K".format(x_tick // 1000) for x_tick in x_ticks[1:]]
        plt.xticks(x_ticks, x_ticks_label, fontsize=20)
    else:
        x_ticks_label = ["0"] + ["{}K".format(x_tick // 1000) for x_tick in xtick[1:]]
        plt.xticks(xtick, x_ticks_label, fontsize=20)
    if dataset=="ImageNet":
        if norm == "l2":
            yticks = np.arange(0, max_y + 1, 5)
        else:
            yticks = np.linspace(0, max_y+0.1,11)
    else:
        if norm == "l2":
            yticks = np.arange(0, max_y+1)
        else:
            yticks = np.linspace(0, max_y+0.1, 11)
    plt.yticks(yticks, fontsize=20)
    plt.xlabel(xlabel, fontsize=25)
    plt.ylabel(ylabel, fontsize=25)

    if "jpeg" in dump_file_path:
        plt.legend(loc='upper right', prop={'size': 15},
                   handlelength=4,framealpha=0.5,fancybox=True,frameon=True)
    elif "ImageNet" == dataset:
        plt.legend(loc='upper right', prop={'size': 15},
                   handlelength=4,framealpha=0.5,fancybox=True,frameon=True)
    elif ("com_defend" in dump_file_path or "feature_distillation" in dump_file_path) and "CIFAR-10" == dataset and targeted:
        plt.legend(loc='upper right', prop={'size': 15},handlelength=4,framealpha=0.5,fancybox=True,frameon=True)
    else:
        plt.legend(loc='upper right', prop={'size': 15},handlelength=4,framealpha=0.5,fancybox=True,frameon=True)
    plt.savefig(dump_file_path, dpi=200)
    plt.close()
    print("save to {}".format(dump_file_path))

def parse_args():
    parser = argparse.ArgumentParser(description='Drawing Figures of Attacking Normal Models')
    parser.add_argument("--fig_type", type=str, choices=["mean_distortion",
                                                         "median_distortion"])
    parser.add_argument("--dataset", type=str, help="the dataset to train")
    parser.add_argument("--norm", type=str, default="l2", choices=["l2", "linf"])
    parser.add_argument("--targeted", action="store_true", help="Does it train on the data of targeted attack?")
    args = parser.parse_args()
    return args


arch_translation = {"resnet-50(TRADES_linf_8_div_255)":"resnet-50_TRADES", "resnet-50(jpeg)":"resnet-50_jpeg",
                    "resnet-50(feature_scatter_linf_16_div_255)":"resnet-50_feature_scatter","resnet-50(feature_distillation)":"resnet-50_feature_distillation",
                    "resnet-50(com_defend)":"resnet-50_com_defend", "resnet-50(AT_linf_8_div_255)":"resnet-50_adv_train",
                    "resnet50(AT_l2_3)":"resnet50_adv_train_on_ImageNet_l2_3","resnet50(AT_linf_4_div_255)":"resnet50_adv_train_on_ImageNet_linf_4_div_255",
                    "resnet50(AT_linf_8_div_255)":"resnet50_adv_train_on_ImageNet_linf_8_div_255"}

if __name__ == "__main__":
    args = parse_args()
    dump_folder = "D:/黑盒攻击论文/hard-label attacks/Prior-OPT/ICLR 2025/figures/query_vs_distortion/attack_defense/"
    os.makedirs(dump_folder, exist_ok=True)
    for norm in ["l2"]:
        for dataset in ["ImageNet","CIFAR-10"]:
            args.norm = norm
            for targeted in [False]:
                if "CIFAR" in dataset:
                    archs = ["resnet-50(AT_linf_8_div_255)", 'resnet-50(TRADES_linf_8_div_255)']
                else:
                    archs= ["resnet50(AT_linf_4_div_255)", "resnet50(AT_l2_3)",
                            "resnet50(AT_linf_8_div_255)"]
                for model in archs:
                    file_path = dump_folder + "{dataset}_{model}_{norm}_{target_str}_attack.pdf".format(dataset=dataset,
                                  model=model, norm=args.norm, target_str="untargeted" if not targeted else "targeted")
                    x_label = "Number of Queries"
                    if args.fig_type == "mean_distortion" and args.norm == "l2":
                        y_label = "Mean $\ell_2$ Distortion"
                    elif args.fig_type == "median_distortion" and args.norm == "l2":
                        y_label = "Median $\ell_2$ Distortion"
                    elif args.fig_type == "mean_distortion" and args.norm == "linf":
                        y_label = "Mean $\ell_\infty$ Distortion"
                    elif args.fig_type == "median_distortion" and args.norm == "linf":
                        y_label = "Median $\ell_\infty$ Distortion"
                    draw_query_distortion_figure(dataset, args.norm, targeted, model, args.fig_type, file_path,x_label,y_label)

