import os
import torch
import argparse
import numpy as np
from PIL import Image
from glob import glob
from tqdm import tqdm
from torchvision.transforms.functional import pil_to_tensor

from pq_utils import (
    get_metrics,
    set_seed,
    apply_single_distortion,
    get_init_latent,
    get_img_tensor,
)

from diffusers import DDIMScheduler
from utils.wm.wm_utils import WmProviders
from main.wmdiffusion import WMDetectStableDiffusionPipeline

from main.attdiffusion import ReSDPipeline
from main.wmattacker import (
    DiffWMAttacker,
    VAEWMAttacker,
    JPEGAttacker,
    RotateAttacker,
    BrightnessAttacker,
    ContrastAttacker,
    GaussianNoiseAttacker,
    GaussianBlurAttacker,
    BM3DAttacker,
)

# Command-line configuration for the attack-robustness evaluation.
# Every parsed value is later forwarded to the watermark provider via
# ``**vars(args)``, so flag names double as provider keyword names.
parser = argparse.ArgumentParser(description="Configuration for image watermarking and generation.")
parser.add_argument(
    '--wm_type',
    type=str,
    default='PQ',
    choices=['GS', 'TR', 'PQ'],
    help='Watermark type to use (GS, TR or PQ).',
)
parser.add_argument('--payload_bits', default=256, type=int)
parser.add_argument('--q_step', default=np.pi, type=float)
parser.add_argument('--n_bins', default=20, type=int)
parser.add_argument('--r_min_ratio', default=0.1, type=float)
parser.add_argument('--r_max_ratio', default=0.7, type=float)
parser.add_argument('--amp_threshold_percentile', default=100, type=int)
parser.add_argument('--seed', type=int, default=42, help='Random seed for reproducibility.')
parser.add_argument(
    '--device',
    type=str,
    default='cuda:3',
    help='Device to run on (e.g., "cuda:0", "cpu").',
)
# The value is passed through to apply_single_distortion unchanged, so it is
# deliberately not restricted with ``choices``; the names listed in the help
# text are the ones this script has been run with.
parser.add_argument(
    '--attack_name',
    type=str,
    default='JPEG',
    help='Name of the distortion to apply, e.g. JPEG, GaussianBlur, '
         'GaussianNoise, Brightness, Resize or SPNoise.',
)
args = parser.parse_args()

# Apply the user-supplied --seed before anything else runs.
set_seed(args.seed)

device = args.device
source_dir = 'gen_pqim'
gt_dir = 'output_images_wo_wm'
# NOTE: glob is called without recursive=True, so '**' behaves like '*'
# and only PNGs directly inside each directory are matched.
source_files = sorted(glob(f'{source_dir}/**.png'))
gt_files = sorted(glob(f'{gt_dir}/**.png'))

# source_files = source_files[:10]
# gt_files = gt_files[:10]

### verify sorting ###
# Explicit raises instead of ``assert`` so the checks survive ``python -O``.
if not source_files:
    # Two empty directories would otherwise pass the length check below and
    # only fail after the diffusion pipeline has been loaded.
    raise FileNotFoundError(f'no PNG files found in {source_dir}')

if len(source_files) != len(gt_files):
    raise ValueError(
        f'length of source_files and gt_files mismatched, {len(source_files)} != {len(gt_files)}'
    )

# The two sorted lists are consumed pairwise later, so each pair must refer to
# the same sample: the source basename up to its first '-' has to equal the
# gt basename up to its first '.'.
for source_file, gt_file in zip(source_files, gt_files):
    source_name = os.path.basename(source_file).split('-')[0]
    gt_name = os.path.basename(gt_file).split('.')[0]
    if source_name != gt_name:
        raise ValueError(f'source and gt sorting dismatched, {source_name} != {gt_name}')
### verify sorting ###


# Each entry is handed as-is to apply_single_distortion; here there is a
# single entry wrapping the attack chosen on the command line.
attack_names = [[args.attack_name]]

# Strength settings passed alongside the attack name to apply_single_distortion.
attack_params = dict(
    jpeg_ratio=25,
    gaussian_blur_r=5,
    gaussian_std=0.1,
    brightness_factor=2,
    resize_ratio=0.5,
    sp_prob=0.2,
)

# Scheduler and detection pipeline are both loaded from the same checkpoint.
sd_repo = 'stabilityai/stable-diffusion-2-1-base'
scheduler = DDIMScheduler.from_pretrained(sd_repo, subfolder="scheduler")
pipe = WMDetectStableDiffusionPipeline.from_pretrained(sd_repo, scheduler=scheduler)
pipe = pipe.to(device)
pipe.set_progress_bar_config(disable=True)

# Embedding of the empty prompt; supplied to get_init_latent for every image.
invert_text_embedding = pipe.get_text_embedding('')

# NOTE(review): presumably the latent size for this checkpoint at 512x512 — confirm.
latent_shape = (1, 4, 64, 64)
# The provider class is looked up by watermark type and receives every CLI
# value as a keyword argument.
provider_cls = WmProviders[args.wm_type].value
wm_provider = provider_cls(latent_shape=latent_shape, **vars(args))

# Per-attack output directories, named after the input directories.
source_save_dir = f'{source_dir}_{args.attack_name}'
gt_save_dir = f'{gt_dir}_{args.attack_name}'
for out_dir in (source_save_dir, gt_save_dir):
    os.makedirs(out_dir, exist_ok=True)
def _latent_path(save_dir, image_path):
    """Return the ``.pt`` path inside *save_dir* named after *image_path*.

    Only the file extension is swapped. A plain ``str.replace('png', 'pt')``
    on the joined path would also rewrite any "png" that appears in a
    directory name or in the file stem.
    """
    stem, _ = os.path.splitext(os.path.basename(image_path))
    return os.path.join(save_dir, stem + '.pt')


def _invert_image(image):
    """Turn a PIL image into a batched tensor on ``device`` and invert it to latents.

    Pixel values are divided by 255 and a leading batch dimension is added
    before the tensor is handed to ``get_init_latent`` together with the shared
    pipeline and the empty-prompt embedding.
    """
    img_tensor = (pil_to_tensor(image) / 255).unsqueeze(0).to(device)
    return get_init_latent(
        img_tensor=img_tensor,
        pipe=pipe,
        text_embeddings=invert_text_embedding,
    )


for attack_name in attack_names:
    print(f'Running {attack_name} ...')

    w_latents = []
    nw_latents = []
    for gt_file, source_file in tqdm(zip(gt_files, source_files), total=len(source_files)):
        # Context managers release the file handles on every iteration;
        # Image.open is lazy, so all pixel access stays inside the block.
        with Image.open(source_file) as wm_image, Image.open(gt_file) as gt_image:
            # Both distortions run before either inversion, matching the
            # original call order so seeded random attacks draw the same values.
            att_wm_image = apply_single_distortion(wm_image, attack_name, attack_params)
            att_gt_image = apply_single_distortion(gt_image, attack_name, attack_params)

            # att_wm_image.save(os.path.join(source_save_dir, os.path.basename(source_file)))
            # att_gt_image.save(os.path.join(gt_save_dir, os.path.basename(gt_file)))

            att_wm_latents = _invert_image(att_wm_image)
            att_gt_latents = _invert_image(att_gt_image)

        # Persist the inverted latents next to the (optional) attacked images.
        torch.save(att_wm_latents, _latent_path(source_save_dir, source_file))
        torch.save(att_gt_latents, _latent_path(gt_save_dir, gt_file))

        w_latents.append(att_wm_latents)
        nw_latents.append(att_gt_latents)

    # Watermarked latents first, clean latents second.
    tpr, mean_w_acc = get_metrics(w_latents, nw_latents, wm_provider)

    print('-'*50)
    print(f'[{attack_name}] | TPR: {tpr} | ACC: {mean_w_acc}')
    print('-'*50)


# NOTE(review): looks like a leftover completion marker — confirm nothing
# parses this output before removing it.
print(0)

