import argparse
import os
import random
import csv

import numpy as np
import torch
import torch.nn as nn
import torch.optim as optim
import torch.backends.cudnn as cudnn
from PIL import Image
from torchvision.utils import save_image
from minigpt_utils import visual_attacker, prompt_wrapper
from transformers import CLIPProcessor, CLIPModel

from minigpt4.common.config import Config
from minigpt4.common.dist_utils import get_rank
from minigpt4.common.registry import registry

from curve.bezier_curve import BezierCurve


def parse_args():

    parser = argparse.ArgumentParser(description="Demo")
    parser.add_argument("--cfg_path", default="eval_configs/minigpt4_eval.yaml", help="path to configuration file.")
    parser.add_argument("--gpu_id", type=int, default=0, help="specify the gpu to load the model.")
    parser.add_argument("--n_iters", type=int, default=500, help="specify the number of iterations for attack.")
    parser.add_argument('--eps', type=int, default=32, help="epsilon of the attack budget")
    parser.add_argument('--alpha', type=int, default=1, help="step_size of the attack")
    parser.add_argument("--constrained", default=False, action='store_true')
    parser.add_argument("--control_points", default=1, help="number of the control points in the quadratic Bezier Curve")
    parser.add_argument("--t_size", default=8, help="number of the sampled t in one iteration")
    parser.add_argument("--classifier_dir", type=str, default='classifier',
                        help="classifier directory")
    parser.add_argument("--save_dir", type=str, default='output',
                        help="save directory")

    parser.add_argument(
        "--options",
        nargs="+",
        help="override some settings in the used config, the key-value pair "
             "in xxx=yyy format will be merged into config file (deprecate), "
             "change to --cfg-options instead.",
    )
    args = parser.parse_args()
    return args

def setup_seeds(config):
    seed = config.run_cfg.seed + get_rank()

    random.seed(seed)
    np.random.seed(seed)
    torch.manual_seed(seed)

    cudnn.benchmark = False
    cudnn.deterministic = True

def load_all_clip_models(root_dir="models"):
    models = {}
    processors = {}
    for name in os.listdir(root_dir):
        subdir = os.path.join(root_dir, name)
        if os.path.isdir(subdir):
            try:
                model = CLIPModel.from_pretrained(subdir)
                processor = CLIPProcessor.from_pretrained(subdir)
                models[name] = model
                processors[name] = processor
                print(f"Loaded CLIP model: {name} from {subdir}")
            except Exception as e:
                print(f"Skipping {subdir}: {e}")
    return models, processors

def main():

    # Model Initialization
    print('>>> Initializing Models')

    args = parse_args()
    cfg = Config(args)

    model_config = cfg.model_cfg
    model_config.device_8bit = args.gpu_id
    model_cls = registry.get_model_class(model_config.arch)
    model = model_cls.from_config(model_config).to('cuda:{}'.format(args.gpu_id))
    model.eval()

    vis_processor_cfg = cfg.datasets_cfg.cc_sbu_align.vis_processor.train
    vis_processor = registry.get_processor_class(vis_processor_cfg.name).from_config(vis_processor_cfg)

    print('[Initialization Finished]\n')

    if not os.path.exists(args.save_dir):
        os.mkdir(args.save_dir)

    # Load the expected responses, which is related to the harmful question
    file = open("harmful_corpus/derogatory_corpus.csv", "r")
    data = list(csv.reader(file, delimiter=","))
    file.close()
    targets = []
    num = len(data)
    for i in range(num):
        targets.append(data[i][0])

    # Build Attacker
    my_attacker = visual_attacker.Attacker(args, model, targets, device=model.device, is_rtp=False)

    # Load Original Image
    template_img = 'jailbreak_images/original.jpg'
    img = Image.open(template_img).convert('RGB')
    img = vis_processor(img).unsqueeze(0).to(model.device)

    text_prompt_template = prompt_wrapper.minigpt4_chatbot_prompt_no_text_input

    # Get the two endpoints.
    if not args.constrained:

        jail_img_prompt_start = my_attacker.attack_unconstrained(text_prompt_template,
                                                          img=img, batch_size=8,
                                                          num_iter=2000, alpha=args.alpha / 255)
        jail_img_prompt_end = my_attacker.attack_unconstrained(text_prompt_template,
                                                                img=img, batch_size=8,
                                                                num_iter=2000, alpha=args.alpha / 255)

    else:
        jail_img_prompt_start = my_attacker.attack_constrained(text_prompt_template,
                                                        img=img, batch_size=8,
                                                        num_iter=2000, alpha=args.alpha / 255,
                                                        epsilon=args.eps / 255)
        jail_img_prompt_end = my_attacker.attack_constrained(text_prompt_template,
                                                              img=img, batch_size=8,
                                                              num_iter=2000, alpha=args.alpha / 255,
                                                              epsilon=args.eps / 255)

    # Build the Bezier Curve
    curve = BezierCurve(jail_img_prompt_start, jail_img_prompt_end, args.control_points)
    ctrl_points = nn.ParameterList([
        nn.Parameter(p.clone().detach().to(device)) for p in curve.control_points
    ])

    optimizer = optim.Adam(ctrl_points, lr=1e-2)

    all_models, all_processors = load_all_clip_models(args.classifier_dir)

    # Optimize the path
    jail_con = my_attacker.attack_curve_guided_constrained(curve, optimizer,
                                                    args.t_size,
                                                    all_models, all_processors,
                                                    text_prompt_template,
                                                    batch_size=8,
                                                    num_iter=3000, alpha=args.alpha / 255,
                                                    epsilon=args.eps / 255)
    curve_state = {
        "start": bezier_curve.start.detach().cpu(),
        "end": bezier_curve.end.detach().cpu(),
        "control_points": [cp.detach().cpu() for cp in bezier_curve.control_points]
    }
    save_path = os.path.join(args.save_dir, 'jailbreak_path.pt')
    torch.save(curve_state, save_path)
    print('[Done]')

if __name__ == "__main__":
    main()