import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from time import time


def skew_matrix(vector3d):
    batch_size = vector3d.size(0)
    s = torch.zeros((batch_size, 3, 3), dtype=vector3d.dtype, device=vector3d.device)
    s[:, 0, 1] = - vector3d[:, 2]
    s[:, 0, 2] = vector3d[:, 1]
    s[:, 1, 0] = vector3d[:, 2]
    s[:, 1, 2] = - vector3d[:, 0]
    s[:, 2, 0] = - vector3d[:, 1]
    s[:, 2, 1] = vector3d[:, 0]
    return s


def compute_Fmatrix(cam_params1, cam_params2):
    intr1, extr1 = cam_params1[:, 1, :3, :3], cam_params1[:, 0, :3, :4]
    intr2, extr2 = cam_params2[:, 1, :3, :3], cam_params2[:, 0, :3, :4]

    rot1, trans1 = extr1[:, :3, :3], extr1[:, :3, [3]]
    rot2, trans2 = extr2[:, :3, :3], extr2[:, :3, [3]]
    cam_center1 = - torch.inverse(rot1) @ trans1
    # cam_center1 = torch.cat((cam_center1, torch.ones_like(cam_center1[:, [0], :])), dim=1)
    cam_center2 = - torch.inverse(rot2) @ trans2

    proj1 = torch.matmul(intr1, rot1)
    proj2 = torch.matmul(intr2, rot2)
    # print(proj2.size(), cam_center1.size())
    cam_center12 = torch.matmul(proj2, cam_center1 - cam_center2)
    # print(cam_center12.size())
    smatrix = skew_matrix(cam_center12.squeeze(2))
    # print(smatrix.size(), proj1.size(), proj2.size())
    Fmatrix = smatrix @ proj2 @ torch.inverse(proj1)

    return Fmatrix


def compute_epipole(Fmatrix):
    c = 1e3
    eq1 = c * Fmatrix[:, 0] + Fmatrix[:, 1] + Fmatrix[:, 2] # [B, 3]
    eq2 = c * Fmatrix[:, 0] - Fmatrix[:, 1] - Fmatrix[:, 2] # [B, 3]
    eq = torch.stack((eq1, eq2), dim=1) # [B, 2, 3]
    epipole = - torch.inverse(eq[:, :, :2]) @ eq[:, :, [2]] # [B, 2, 1]
    return epipole.squeeze(2)


def dGauss(img, kernel_size):
    in_channels = img.shape[1]
    sigma = float(1.2 * kernel_size / 9)
    y, x = torch.meshgrid([torch.arange(-(kernel_size - 1) // 2, (kernel_size - 1) // 2 + 1, dtype=torch.float32, device=img.device),
                           torch.arange(-(kernel_size - 1) // 2, (kernel_size - 1) // 2 + 1, dtype=torch.float32, device=img.device)])
    gauss_kernel = torch.exp(- (x ** 2 + y ** 2) / (2 * sigma ** 2)) / (2 * np.pi * sigma ** 2)

    gx = -x / (sigma ** 2) * gauss_kernel
    gy = -y / (sigma ** 2) * gauss_kernel
    gxx = (x ** 2 - sigma ** 2) / (sigma ** 4) * gauss_kernel # normalize
    gxx -= gxx.sum(dim=1, keepdims=True) / kernel_size 
    gxy = x * y / (sigma ** 4) * gauss_kernel
    gyy = (y ** 2 - sigma ** 2) / (sigma ** 4) * gauss_kernel
    gyy -= gyy.sum(dim=0, keepdims=True) / kernel_size # normalize
    weight = torch.stack((gx, gy, gxx, gxy, gyy))
    weight = weight.unsqueeze(1).repeat(1, in_channels, 1, 1) / in_channels
    filtered_results = F.conv2d(img, weight, None, 1, (kernel_size-1)//2, 1, 1)
    dx, dy, dxx, dxy, dyy = torch.unbind(filtered_results, dim=1)
    return dx.unsqueeze(1), dy.unsqueeze(1), dxx.unsqueeze(1), dxy.unsqueeze(1), dyy.unsqueeze(1)


class DynamicConv(nn.Module):
    def __init__(self, in_c, out_c, size_kernels=(3, 5, 7), stride=1, bias=True, thresh_curv=0.01, **kwargs):
        super(DynamicConv, self).__init__()
        self.size_kernels = size_kernels
        self.thresh_curv = thresh_curv
        self.auto_selection = kwargs.get("auto_selection", False)
        self.convs = nn.ModuleList([nn.Conv2d(in_c, out_c, k, padding=(k-1)//2, stride=stride, bias=bias) for k in self.size_kernels])
        if self.auto_selection:
            hidden_dim = kwargs.get("hidden_dim", 4)
            self.att_weights = nn.Sequential(nn.Conv2d(len(size_kernels), hidden_dim, 1, bias=False),
                                             nn.BatchNorm2d(hidden_dim),
                                             nn.ReLU(inplace=True),
                                             nn.Conv2d(hidden_dim, len(size_kernels), 1, bias=False))

    def forward(self, feature_vol, epipole=None, temperature=0.001):
        batch_size, height, width = feature_vol.shape[0], feature_vol.shape[2], feature_vol.shape[3]
        y, x = torch.meshgrid([torch.arange(0, height, dtype=torch.float32, device=feature_vol.device),
                               torch.arange(0, width, dtype=torch.float32, device=feature_vol.device)])
        x, y = x.contiguous(), y.contiguous()
        epipole_map = epipole.unsqueeze(-1).unsqueeze(-1) # [B, 2, 1, 1]
        u = x.unsqueeze(0).unsqueeze(0) - epipole_map[:, [0], :, :] # [B, 1, H, W]
        v = y.unsqueeze(0).unsqueeze(0) - epipole_map[:, [1], :, :] # [B, 1, H, W]
        normed_uv = torch.sqrt(u**2 + v**2)
        u, v = u / (normed_uv + 1e-6), v / (normed_uv + 1e-6)

        curvs = []
        results = []
        for idx, s in enumerate(self.size_kernels):
            dx, dy, dxx, dxy, dyy = dGauss(feature_vol.detach(), s)
            num = (torch.cat((dxx, dxy, dyy), dim=1) * torch.cat((u**2, 2*u*v, v**2), dim=1)).sum(dim=1, keepdim=True)
            den = torch.sqrt(1 + dx**2 + dy**2) * (1 + (u*dx + v*dy)**2)
            curv = num / den
            curvs.append(curv) #.unsqueeze(1))
            results.append(self.convs[idx](feature_vol).unsqueeze(1))
        curvs = torch.cat(curvs, dim=1) # [B, num_kernels, H, W]
        results = torch.cat(results, dim=1)
        if self.auto_selection:
            weights = self.att_weights(curvs)
            weights = F.softmax(weights / temperature, dim=1)
            filtered_result = (results * weights.unsqueeze(2)).sum(dim=1)
            est_curv = (curvs * weights).sum(dim=1, keepdim=True)
        else:
            indices = torch.argmin((curvs - self.thresh_curv).abs(), dim=1, keepdim=True)
            est_curv = torch.gather(curvs, 1, indices)
            filtered_result = torch.gather(results, 1, indices.unsqueeze(2).repeat(1, 1, results.shape[2], 1, 1))
            filtered_result = filtered_result.squeeze(1)
        return filtered_result, est_curv


"""class DynamicConv(nn.Module):
    def __init__(self, in_c, out_c, size_kernels=(3, 5, 7), stride=1, bias=True, thresh_scale=0.01, **kwargs):
        super(DynamicConv, self).__init__()
        self.size_kernels = size_kernels
        self.thresh_scale = thresh_scale
        self.att_convs = nn.ModuleList([nn.Conv2d(in_c, 3, k, padding=(k-1)//2, bias=False) for k in size_kernels])
        self.convs = nn.ModuleList([nn.Conv2d(in_c, out_c, k, padding=(k-1)//2, stride=stride, bias=bias) for k in self.size_kernels])
        hidden_dim = kwargs.get("hidden_dim", 4)
        self.att_weights = nn.Sequential(nn.Conv2d(len(size_kernels), hidden_dim, 1, bias=False),
                                         nn.BatchNorm2d(hidden_dim),
                                         nn.ReLU(inplace=True),
                                         nn.Conv2d(hidden_dim, len(size_kernels), 1, bias=False))
        # att_weights = []
        # for k in size_kernels:
        #     att_weights.append(nn.Sequential(nn.Conv2d(in_c, hidden_dim, k, padding=(k-1)//2, bias=False),
        #                                      nn.ReLU(inplace=True),
        #                                      nn.Conv2d(hidden_dim, 1, 1, bias=True)))
        # self.att_weights = nn.ModuleList(att_weights)
        # self.temperature = kwargs.get("temperature", 0.001)

        for p in self.att_convs.parameters():
            torch.nn.init.normal_(p, std=0.1)

    def forward(self, feature_vol, epipole=None, temperature=0.001):
        # surface = feature_vol.mean(dim=1, keepdim=True)
        batch_size, height, width = feature_vol.shape[0], feature_vol.shape[2], feature_vol.shape[3]
        y, x = torch.meshgrid([torch.arange(0, height, dtype=torch.float32, device=feature_vol.device),
                               torch.arange(0, width, dtype=torch.float32, device=feature_vol.device)])
        x, y = x.contiguous(), y.contiguous()
        epipole_map = epipole.unsqueeze(-1).unsqueeze(-1) # [B, 2, 1, 1]
        u = x.unsqueeze(0).unsqueeze(0) - epipole_map[:, [0], :, :] # [B, 1, H, W]
        v = y.unsqueeze(0).unsqueeze(0) - epipole_map[:, [1], :, :] # [B, 1, H, W]
        normed_uv = torch.sqrt(u**2 + v**2)
        u, v = u / (normed_uv + 1e-6), v / (normed_uv + 1e-6)

        curvs = []
        results = []
        for idx, s in enumerate(self.size_kernels):
            curv = self.att_convs[idx](feature_vol)
            curv = (curv * torch.cat((u**2, 2*u*v, v**2), dim=1)).sum(dim=1, keepdim=True)
            # w = self.att_weights[idx](feature_vol)
            curvs.append(curv) #.unsqueeze(1))
            results.append(self.convs[idx](feature_vol).unsqueeze(1))
        curvs = torch.cat(curvs, dim=1) # [B, num_kernels, H, W]
        weights = self.att_weights(curvs)
        weights = F.softmax(weights / temperature, dim=1)
        filtered_result = (torch.cat(results, dim=1) * weights.unsqueeze(2)).sum(dim=1)
        norm_curv = (curvs * weights).sum(dim=1, keepdim=True)
        return filtered_result, norm_curv #, sum_mask, t11, t12, t13"""


def read_cam_file(filename, interval_scale=1.0):
    with open(filename) as f:
        lines = f.readlines()
        lines = [line.rstrip() for line in lines]
    # extrinsics: line [1,5), 4x4 matrix
    extrinsics = np.fromstring(' '.join(lines[1:5]), dtype=np.float32, sep=' ').reshape((4, 4))
    # intrinsics: line [7-10), 3x3 matrix
    intrinsics = np.fromstring(' '.join(lines[7:10]), dtype=np.float32, sep=' ').reshape((3, 3))
    intrinsics[:2, :] /= 4.0
    # depth_min & depth_interval: line 11
    depth_min = float(lines[11].split()[0])
    depth_interval = float(lines[11].split()[1])

    if len(lines[11].split()) >= 3:
        num_depth = lines[11].split()[2]
        depth_max = depth_min + int(float(num_depth)) * depth_interval
        depth_interval = (depth_max - depth_min) / 192

    depth_interval *= interval_scale

    return intrinsics, extrinsics, depth_min, depth_interval


if __name__ == '__main__':
    # from PIL import Image
    # from torchvision.transforms import ToTensor
    #
    # ref_img = Image.open(r"D:\lab\dtu\scan4\images\00000000.jpg")
    # ref_img = ToTensor()(ref_img).cuda()
    # src_img = Image.open("D:/lab/dtu/scan4/images/00000010.jpg")
    # src_img = ToTensor()(src_img).cuda()
    #
    # ref_intr, ref_extr, _, _ = read_cam_file("D://lab/dtu/scan4/cams/00000000_cam.txt")
    # src_intr, src_extr, _, _ = read_cam_file("D://lab/dtu/scan4/cams/00000010_cam.txt")
    #
    # ref_cam_params = torch.zeros(1, 2, 4, 4)
    # ref_cam_params[0, 0, :4, :4] = torch.tensor(ref_extr, dtype=torch.float32)
    # ref_cam_params[0, 1, :3, :3] = torch.tensor(ref_intr, dtype=torch.float32)
    # ref_cam_params = ref_cam_params.cuda()
    #
    # src_cam_params = torch.zeros(1, 2, 4, 4)
    # src_cam_params[0, 0, :4, :4] = torch.tensor(src_extr, dtype=torch.float32)
    # src_cam_params[0, 1, :3, :3] = torch.tensor(src_intr, dtype=torch.float32)
    # src_cam_params = src_cam_params.cuda()
    #
    # Fmatrix = compute_Fmatrix(ref_cam_params, src_cam_params)
    # ref_epipole = compute_epipole(Fmatrix)
    # src_epipole = compute_epipole(torch.transpose(Fmatrix, 1, 2))
    # print("reference epipole: ", ref_epipole)
    # print("src epipole: ", src_epipole)
    #
    # # compare with opencv result
    # import cv2
    # np_Fmatrix = Fmatrix[0].cpu().numpy()
    # src_line = cv2.computeCorrespondEpilines(np.zeros((1, 1, 2)), 1, np_Fmatrix)
    # src_line = src_line.reshape(-1, 3)
    # src_point = np.array([0, -src_line[0][2] / src_line[0][1]], dtype=np.float32)
    # ref_line = cv2.computeCorrespondEpilines(src_point.reshape((1, 1, 2)), 2, np_Fmatrix)
    # ref_line = ref_line.reshape(-1, 3)
    # print(ref_line[0][:2])
    #
    # print(ref_epipole / torch.sqrt((ref_epipole**2).sum()))

    # gauss_filter = GaussFilter2d(3, 1, 9, padding=4, device=ref_img.device)
    # filtered_img = gauss_filter(ref_img.unsqueeze(0), filter_type='xx')
    import matplotlib.pyplot as plt
    # import matplotlib
    # cmap = matplotlib.cm.gray
    # plt.imshow(filtered_img.squeeze(0).squeeze(0).cpu().numpy())
    # plt.colorbar()
    # plt.show()
    ref_img = torch.rand(3, 400, 400).float().cuda()
    ref_epipole = torch.rand(1, 2).cuda()
    from time import time
    conv = DynamicConv(3, 1, size_kernels=(3, 5, 7, 9), thresh_scale=0.005)
    conv = conv.to(torch.device('cuda'))
    t1 = time()
    conv_img = conv(ref_img.unsqueeze(0), epipole=ref_epipole)
    t2 = time()
    # conv = nn.Conv2d(3, 1, 7, padding=3).to(torch.device('cuda'))
    # t3 = time()
    # conv_img = conv(ref_img.unsqueeze(0))
    # t4 = time()
    print("Time of Dynamic Conv: ", t2-t1)
    # print("Time of original Conv: ", t4-t3)
    # plt.imshow(mask.squeeze(0).squeeze(0).cpu().numpy())
    # plt.colorbar()
    # plt.show()






