import torch
import numpy as np
import onnxruntime as ort
import cv2
from PIL import Image
import os
import sys
import pathlib
from torchvision import transforms
import gc
# Repository root: two directory levels above the directory holding this file.
root_dir = pathlib.Path(__file__).resolve().parents[2]
# sys.path entries must be plain strings (the import machinery skips anything
# else), so the root is appended once, in string form.
sys.path.append(str(root_dir))
from utils import plot_logits_to_mask


# Add <root>/Reach_Factory to the import path before importing the two
# project modules below.
reach_factory_path = os.path.join(root_dir, 'Reach_Factory')
sys.path.append(reach_factory_path)
from Provision_All import Reachability_provider
from Segmentation import Segmentor




def Camvid_exp1(delta_rgb,  Nt, N_dir, image_name,
                  Ns, Nsp, rank, device,  threshold_normal,
                  sim_batch, trn_batch, surrogate_mode):
    """Run the reachability provider for one image and one perturbation size.

    The function loads ``models/BiSeNet.onnx`` and ``images/<image_name>``
    relative to the current working directory, preprocesses the image
    (BGR -> RGB, resize to 960x720, scale to [0, 1], per-channel
    mean/std normalisation), runs the model once to obtain the per-pixel
    argmax labels, and then hands everything to ``Reachability_provider``
    and calls its ``Provider()`` method.

    Args:
        delta_rgb: Perturbation magnitude on the 0-255 pixel scale. It is
            divided by 255 and by the per-channel std before being passed
            to the provider as ``de``; the raw value is also stored in
            ``params['perturbation']``.
        Nt, N_dir, Ns, Nsp, rank, threshold_normal, sim_batch, trn_batch:
            Forwarded unchanged to ``Reachability_provider`` through the
            ``params`` dict under keys of the same name.
        image_name: File name of the image inside ``<cwd>/images``.
        device: Torch device on which the image and model output tensors
            are placed.
        surrogate_mode: Passed to ``Reachability_provider`` as ``mode``.

    Raises:
        FileNotFoundError: If OpenCV cannot read the image file.
    """
    de = delta_rgb / 255.0
    model_name = 'BiSeNet.onnx'
    height, width = 720, 960  # spatial size the image is resized to

    current_dir = os.getcwd()
    model_path = os.path.join(current_dir, 'models', model_name)
    image_path = os.path.join(current_dir, 'images', image_name)

    # Prefer CUDA, but list the CPU provider as a fallback so the session can
    # still be created on machines where the CUDA provider is unavailable.
    ort_session = ort.InferenceSession(
        model_path,
        providers=['CUDAExecutionProvider', 'CPUExecutionProvider'],
    )

    img = cv2.imread(image_path)  # BGR format
    if img is None:
        # cv2.imread signals failure by returning None instead of raising.
        raise FileNotFoundError(
            f"Could not read image (missing or unreadable): {image_path}"
        )
    img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
    img = cv2.resize(img, (width, height))  # cv2.resize expects (width, height)
    img_np = img.astype(np.float32) / 255.0  # [H, W, 3] float32 in [0, 1]
    img_np = np.transpose(img_np, (2, 0, 1))  # [3, H, W]
    img_np = img_np.reshape(1, 3, height, width)

    # --- Normalize image ---
    # mean/std are float64 arrays, so img_norm (and the tensor built from it)
    # is float64 as well.
    mean_vals = np.array([0.485, 0.456, 0.406]).reshape(1, 3, 1, 1)
    std_vals = np.array([0.229, 0.224, 0.225]).reshape(1, 3, 1, 1)

    img_norm = (img_np - mean_vals) / std_vals
    img_tensor = torch.from_numpy(img_norm).to(device)

    # The model input is rounded through float16 and fed to ONNX Runtime as
    # float32; the un-rounded img_tensor is what is passed on as the centre.
    x = img_tensor.to(torch.float16)  # Use half precision
    x_numpy = x.cpu().numpy().astype(np.float32)
    output = ort_session.run(None, {'input': x_numpy})
    output = torch.tensor(output[0]).to(device)

    plot_logits_to_mask(output)

    output_dim = output.shape

    # Per-pixel predicted label: argmax over dim 1 of the model output.
    _, True_class_tensor = torch.max(output, dim=1)
    True_class_tensor = True_class_tensor.squeeze(0)
    True_class = True_class_tensor.cpu().tolist()

    Cent = img_tensor

    params = {
        'sim_batch' : sim_batch,
        'Nt' : Nt,
        'N_dir' : N_dir,
        'trn_batch' : trn_batch,
        'threshold_normal' : threshold_normal,
        'Ns' : Ns,
        'Nsp' : Nsp,
        'rank' : rank,
        'perturbation' : delta_rgb,
        'True_class' : True_class,
        'class_threshold' : None,
        'image_name' : image_name,
        'input_name' : 'input'
    }

    provide = Reachability_provider(
        # Perturbation expressed in normalised units: (delta/255) / std,
        # one value per channel with shape (1, 3, 1, 1).
        de = torch.tensor(de/std_vals).to(device),
        device = device,
        model = ort_session,
        Cent = Cent,
        original_dim = (3, height, width),
        output_dim = output_dim,
        mode = surrogate_mode,
        radii_mode = "L2",
        params = params
        )

    # NOTE(review): these keys are added after the provider was constructed, so
    # they only take effect if the provider keeps a reference to this same dict
    # rather than a copy -- confirm against Reachability_provider.
    params.update({
    'gb_workers': 112,          # number of CPU workers (processes)
    'gb_threads': 1,            # threads per Gurobi model (keep small when many workers)
    'gb_presolve': 2,
    'gb_method': 1,
    'gb_opt_tol': 1e-9,
    'gb_feas_tol': 1e-9,

    # batch sizing knobs (optional)
    # 'gb_inner_batch': 16,      # hard override if you want a fixed size
    'gb_tasks_per_worker': 4,   # auto: at least 4 LPs queued per worker
    'gb_inner_batch_min': 4,    # don't go below this
    'gb_inner_batch_max': 64,   # keep LPs small; 32-64 works well
    'gb_cap_by_ndir': True,     # also bound by N_dir // 2 for safety
    })

    provide.Provider()




def Camvid_exp2(projection_batch, guarantee, device, src_dir, nnv_dir):
    """Construct a ``Segmentor`` and run its ``Mask_titles`` step.

    Args:
        projection_batch: Stored in the Segmentor params under
            ``'projection_batch'``.
        guarantee: Stored in the Segmentor params under ``'guarantee'``.
        device: Forwarded to ``Segmentor`` as ``device``.
        src_dir: Forwarded to ``Segmentor`` as ``src_dir``.
        nnv_dir: Forwarded to ``Segmentor`` as ``nnv_dir``.
    """
    segmentor_params = dict(
        projection_batch=projection_batch,
        guarantee=guarantee,
    )
    segmentor = Segmentor(
        device=device,
        src_dir=src_dir,
        nnv_dir=nnv_dir,
        params=segmentor_params,
    )
    segmentor.Mask_titles()





if __name__ == '__main__':
    # Script entry point: for every image and every perturbation size, run
    # Camvid_exp1 followed by Camvid_exp2, then release memory before the
    # next combination.

    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

    # Settings forwarded unchanged to Camvid_exp1.
    Ns = 8000
    Nsp = 150
    rank = 7999
    Nt = 2100
    N_dir = 150
    threshold_normal = 1e-5
    sim_batch = 5
    trn_batch = 10
    surrogate_mode = 'CLP'

    # Settings forwarded unchanged to Camvid_exp2.
    guarantee = 0.999
    src_dir = None
    nnv_dir = None
    projection_batch = 720*960  # pixel count of the 720x960 images used above

    image_names = [
        '0001TP_008790.png',
        '0001TP_010110.png',
        '0001TP_010290.png',
        '0006R0_f02190.png',
        'Seq05VD_f00000.png',
        'Seq05VD_f00090.png',
        # Additional frames, currently disabled:
        # 'Seq05VD_f01320.png',
        # 'Seq05VD_f01410.png',
        # 'Seq05VD_f02070.png',
        # 'Seq05VD_f03540.png'
        ]

    # Perturbation magnitudes on the 0-255 pixel scale.
    delta_rgb_list = [50, 100, 150]

    for image_name in image_names:
        for delta_rgb in delta_rgb_list:

            # Include delta_rgb so the runs for one image are distinguishable
            # in the log.
            print(f"Running: {image_name} with N_perturbed = ALL, delta_rgb = {delta_rgb}")

            Camvid_exp1( delta_rgb,  Nt, N_dir, image_name,
                           Ns, Nsp, rank, device,  threshold_normal,
                           sim_batch, trn_batch, surrogate_mode)

            Camvid_exp2( projection_batch, guarantee, device, src_dir, nnv_dir )

            # Drop Python garbage and cached CUDA blocks between runs.
            gc.collect()
            torch.cuda.empty_cache()
            