import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.ao.quantization as tq

# ----------------- Building blocks -----------------
class DoubleConv(nn.Module):
    """Two stacked 3x3 Conv2d -> BatchNorm2d -> ReLU stages.

    Args:
        in_channels: Channels of the input tensor.
        out_channels: Channels produced by the second stage.
        mid_channels: Channels between the two stages. Any falsy value
            (``None`` or ``0``) falls back to ``out_channels``.

    The layers live in ``self.double_conv`` in the fixed order
    conv, bn, relu, conv, bn, relu (indices 0-5).
    """

    @staticmethod
    def _stage(c_in, c_out):
        """Return one [Conv2d, BatchNorm2d, ReLU] triple as a list."""
        return [
            # bias is disabled on the conv; BatchNorm follows directly.
            nn.Conv2d(c_in, c_out, kernel_size=3, padding=1, bias=False),
            nn.BatchNorm2d(c_out),
            nn.ReLU(inplace=True),
        ]

    def __init__(self, in_channels, out_channels, mid_channels=None):
        super().__init__()
        hidden = mid_channels or out_channels
        layers = self._stage(in_channels, hidden) + self._stage(hidden, out_channels)
        self.double_conv = nn.Sequential(*layers)

    def forward(self, x):
        """Run ``x`` through both conv stages and return the result."""
        out = self.double_conv(x)
        return out

class Down(nn.Module):
    """Downscaling step: 2x2 max-pooling followed by a DoubleConv.

    Args:
        in_channels: Channels of the input tensor.
        out_channels: Channels produced by the DoubleConv.

    ``self.maxpool_conv`` is a two-element Sequential: index 0 is the
    pooling layer and index 1 is the DoubleConv.
    """

    def __init__(self, in_channels, out_channels):
        super().__init__()
        pool = nn.MaxPool2d(2)
        convs = DoubleConv(in_channels, out_channels)
        self.maxpool_conv = nn.Sequential(pool, convs)

    def forward(self, x):
        """Pool ``x`` and then convolve it."""
        pooled_and_convolved = self.maxpool_conv(x)
        return pooled_and_convolved

class Up(nn.Module):
    """Upscaling step: upsample, align with the skip tensor, concat, DoubleConv.

    Args:
        in_channels: Channels of the concatenated tensor fed to the DoubleConv.
        out_channels: Channels produced by the DoubleConv.
        bilinear: If True, upsample with a parameter-free bilinear
            ``nn.Upsample`` and use ``in_channels // 2`` as the DoubleConv's
            middle width. Otherwise upsample with a stride-2
            ``nn.ConvTranspose2d`` that halves the channel count.
    """

    def __init__(self, in_channels, out_channels, bilinear=True):
        super().__init__()
        if bilinear:
            self.up = nn.Upsample(scale_factor=2, mode='bilinear', align_corners=True)
            self.conv = DoubleConv(in_channels, out_channels, in_channels // 2)
        else:
            # ConvTranspose2d is supported too, but note that QAT requires a
            # per-tensor qconfig for it.
            self.up = nn.ConvTranspose2d(in_channels, in_channels // 2, kernel_size=2, stride=2, bias=False)
            self.conv = DoubleConv(in_channels, out_channels)

        # Eager-mode quantization cannot observe or swap a bare torch.cat call.
        # Routing the concat through FloatFunctional lets prepare/convert attach
        # an observer and replace it with the quantized op. In float mode it is
        # a plain torch.cat and adds no parameters or buffers.
        self.skip_cat = nn.quantized.FloatFunctional()

    def forward(self, x1, x2):
        """Upsample ``x1``, pad it to ``x2``'s spatial size, and fuse both.

        Args:
            x1: Tensor to be upsampled.
            x2: Skip-connection tensor; its dims 2 and 3 set the target size.

        Returns:
            Output of the DoubleConv applied to ``cat([x2, x1], dim=1)``.
        """
        x1 = self.up(x1)

        # Size mismatch along dims 2 and 3 between skip tensor and upsampled one.
        diffY = x2.size(2) - x1.size(2)
        diffX = x2.size(3) - x1.size(3)

        # F.pad takes the last dimension first: (left, right, top, bottom).
        # An odd difference puts the extra row/column on the right/bottom.
        x1 = F.pad(x1, [diffX // 2, diffX - diffX // 2,
                        diffY // 2, diffY - diffY // 2])

        x = self.skip_cat.cat([x2, x1], dim=1)
        return self.conv(x)

class OutConv(nn.Module):
    """Final projection: a single 1x1 convolution (with bias).

    Args:
        in_channels: Channels of the incoming feature map.
        out_channels: Channels of the produced map.
    """

    def __init__(self, in_channels, out_channels):
        super().__init__()
        pointwise = nn.Conv2d(in_channels, out_channels, kernel_size=1)
        self.conv = pointwise

    def forward(self, x):
        """Apply the 1x1 convolution to ``x``."""
        projected = self.conv(x)
        return projected

# ----------------- Quantization-friendly UNet -----------------
class QuantizableUNet(nn.Module):
    """U-Net wrapped with Quant/DeQuant stubs for eager-mode quantization.

    The network is an encoder (``inc``, ``down1``-``down4``), a decoder
    (``up1``-``up4``) that consumes the encoder outputs as skip connections,
    and a 1x1 output convolution (``outc``).

    Args:
        n_classes: Output channels of the final 1x1 convolution.
        n_channels: Channels of the input tensor.
        layer_num: Width of the first encoder stage; deeper stages use
            multiples of it.
        bilinear: Forwarded to every ``Up`` block. When True, the bottleneck
            and decoder widths are halved (``factor = 2``).
    """

    def __init__(self, n_classes=2, n_channels=4, layer_num=64, bilinear=True):
        super().__init__()
        self.bilinear = bilinear

        # Encoder
        self.inc   = DoubleConv(n_channels, layer_num)
        self.down1 = Down(layer_num, layer_num*2)
        self.down2 = Down(layer_num*2, layer_num*4)
        self.down3 = Down(layer_num*4, layer_num*8)
        factor = 2 if bilinear else 1
        self.down4 = Down(layer_num*8, layer_num*16 // factor)

        # Decoder
        self.up1 = Up(layer_num*16, layer_num*8 // factor, bilinear)
        self.up2 = Up(layer_num*8,  layer_num*4 // factor, bilinear)
        self.up3 = Up(layer_num*4,  layer_num*2 // factor, bilinear)
        self.up4 = Up(layer_num*2,  layer_num,              bilinear)
        self.outc = OutConv(layer_num, n_classes)

        # Quantization entry/exit points
        self.quant = tq.QuantStub()
        self.dequant = tq.DeQuantStub()

    def forward(self, x):
        """Return the logits for ``x``.

        The input goes through ``self.quant`` first and the logits go through
        ``self.dequant`` last.
        """
        x = self.quant(x)

        # Encoder: keep every stage's output for the skip connections.
        x1 = self.inc(x)
        x2 = self.down1(x1)
        x3 = self.down2(x2)
        x4 = self.down3(x3)
        x5 = self.down4(x4)

        # Decoder: each step merges with the matching encoder output.
        x = self.up1(x5, x4)
        x = self.up2(x,  x3)
        x = self.up3(x,  x2)
        x = self.up4(x,  x1)
        logits = self.outc(x)

        logits = self.dequant(logits)
        return logits

    def fuse_model(self, is_qat=None):
        """Fuse every Conv2d + BatchNorm2d + ReLU triple in place.

        Args:
            is_qat: True to fuse for quantization-aware training (BatchNorm is
                kept inside the fused module), False to fold BatchNorm into
                the convolution for inference. ``None`` (default) follows
                ``self.training``.

        Fusing with ``is_qat=False`` still requires the model to be in eval
        mode, as enforced by ``torch.ao.quantization.fuse_modules``.
        """
        if is_qat is None:
            is_qat = self.training

        if is_qat:
            # fuse_modules_qat is missing in older releases, where
            # fuse_modules itself handled training-mode fusion.
            fuse_fn = getattr(tq, "fuse_modules_qat", tq.fuse_modules)
        else:
            fuse_fn = tq.fuse_modules

        # Snapshot first, because fusing mutates the module tree. Only plain
        # nn.Sequential containers are visited: already-fused modules are
        # Sequential subclasses and must not be fused a second time.
        containers = [m for m in self.modules() if type(m) is nn.Sequential]
        for seq in containers:
            self._fuse_conv_bn_relu(seq, fuse_fn)

    @staticmethod
    def _fuse_conv_bn_relu(seq, fuse_fn):
        """Fuse each consecutive (Conv2d, BatchNorm2d, ReLU) run inside ``seq``."""
        pattern = (nn.Conv2d, nn.BatchNorm2d, nn.ReLU)
        i = 0
        while i + 2 < len(seq):
            window = (seq[i], seq[i + 1], seq[i + 2])
            if all(isinstance(mod, kind) for mod, kind in zip(window, pattern)):
                fuse_fn(seq, [str(i), str(i + 1), str(i + 2)], inplace=True)
                # The fused slots become Identity, so skip past all three.
                i += 3
            else:
                i += 1
