import torch
import torch.nn as nn
import torch.nn.functional as F
import math

# Maps an architecture name to the URL of a checkpoint file.
# Nothing in the visible part of this file reads this dict; the file names at
# the end of the URLs match the default ``pretrained_backbone`` file names used
# by the factory functions below.
# NOTE(review): presumably these are the ImageNet-pretrained torchvision
# weights -- confirm before relying on that.
model_urls = {
    "resnet18": "https://s3.amazonaws.com/pytorch/models/resnet18-5c106cde.pth",
    "resnet34": "https://s3.amazonaws.com/pytorch/models/resnet34-333f7ec4.pth",
    "resnet50": "https://s3.amazonaws.com/pytorch/models/resnet50-19c8e357.pth",
    "resnet101": "https://s3.amazonaws.com/pytorch/models/resnet101-5d3b4d8f.pth",
    "resnet152": "https://s3.amazonaws.com/pytorch/models/resnet152-b121ed2d.pth",
}


class BasicBlock(nn.Module):
    """Residual block built from two 3x3 convolutions.

    The first convolution carries the stride; the second always uses stride 1.
    Each convolution is followed by batch normalisation. The block outputs
    ``planes * expansion`` channels.

    When the stride is not 1, or the input channel count differs from the
    output channel count, the shortcut is a strided 1x1 convolution followed
    by batch normalisation. Otherwise the input is added back unchanged.

    Args:
        inplanes: number of channels of the incoming tensor.
        planes: number of channels produced by both 3x3 convolutions.
        stride: stride of the first convolution and of the projection shortcut.
    """

    expansion = 1

    def __init__(self, inplanes, planes, stride=1):
        super(BasicBlock, self).__init__()
        out_planes = self.expansion * planes

        # Main path. Sub-modules are created in a fixed order so parameter
        # names and initialisation order stay stable.
        self.conv1 = nn.Conv2d(
            inplanes, planes, kernel_size=3, stride=stride, padding=1, bias=False
        )
        self.bn1 = nn.BatchNorm2d(planes)
        self.relu = nn.ReLU(inplace=True)
        self.conv2 = nn.Conv2d(
            planes, planes, kernel_size=3, stride=1, padding=1, bias=False
        )
        self.bn2 = nn.BatchNorm2d(planes)

        # Shortcut path: project only when the shapes would not line up.
        needs_projection = stride != 1 or out_planes != inplanes
        self.downsample = (
            nn.Sequential(
                nn.Conv2d(
                    inplanes, out_planes, kernel_size=1, stride=stride, bias=False
                ),
                nn.BatchNorm2d(out_planes),
            )
            if needs_projection
            else None
        )

    def forward(self, x):
        """Apply the two convolutions, add the shortcut, and apply ReLU."""
        out = self.relu(self.bn1(self.conv1(x)))
        out = self.bn2(self.conv2(out))

        shortcut = x if self.downsample is None else self.downsample(x)

        out += shortcut
        return self.relu(out)


class BottleNeck(nn.Module):
    """Bottleneck residual block: 1x1 conv -> 3x3 conv -> 1x1 conv plus shortcut.

    The two inner convolutions work on ``planes`` channels and the last 1x1
    convolution produces ``planes * expansion`` channels. The stride is
    applied in the 3x3 convolution.

    When the stride is not 1, or the input channel count differs from the
    output channel count, the shortcut is a strided 1x1 convolution followed
    by batch normalisation. Otherwise the input is added back unchanged.

    Args:
        inplanes: number of channels of the incoming tensor.
        planes: number of channels of the two inner convolutions.
        stride: stride of the 3x3 convolution and of the projection shortcut.
    """

    expansion = 4

    def __init__(self, inplanes, planes, stride=1):
        super(BottleNeck, self).__init__()
        self.conv1 = nn.Conv2d(inplanes, planes, kernel_size=1, bias=False)
        self.bn1 = nn.BatchNorm2d(planes)
        self.relu1 = nn.ReLU(True)
        self.conv2 = nn.Conv2d(
            planes, planes, kernel_size=3, stride=stride, padding=1, bias=False
        )
        self.bn2 = nn.BatchNorm2d(planes)
        self.relu2 = nn.ReLU(True)
        self.conv3 = nn.Conv2d(
            planes, planes * self.expansion, kernel_size=1, bias=False
        )
        self.bn3 = nn.BatchNorm2d(planes * self.expansion)
        # Project the shortcut only when its shape would not match the main path.
        if stride != 1 or self.expansion * planes != inplanes:
            self.downsample = nn.Sequential(
                nn.Conv2d(
                    inplanes,
                    self.expansion * planes,
                    kernel_size=1,
                    stride=stride,
                    bias=False,
                ),
                nn.BatchNorm2d(self.expansion * planes),
            )
        else:
            self.downsample = None
        self.relu = nn.ReLU(True)

    def forward(self, x):
        """Run the three convolutions, add the shortcut, and apply ReLU."""
        out = self.relu1(self.bn1(self.conv1(x)))
        out = self.relu2(self.bn2(self.conv2(out)))
        out = self.bn3(self.conv3(out))

        # Identity comparison: ``None`` is a singleton, so ``is not`` is the
        # correct test and matches the check used in BasicBlock.
        if self.downsample is not None:
            residual = self.downsample(x)
        else:
            residual = x

        out = out + residual
        out = self.relu(out)
        return out


class ResNet(nn.Module):
    """ResNet feature extractor that returns the output of its last stage.

    The network is a 7x7 stride-2 convolution with batch norm and ReLU, a
    3x3 stride-2 max pooling, and four stages (``layer1`` .. ``layer4``) of
    residual blocks with base widths 64, 128, 256 and 512. There is no
    pooling or classifier after ``layer4``.

    Args:
        cfg: accepted for interface compatibility; this class does not read it.
        block_type: block class to instantiate. It must expose an
            ``expansion`` attribute and accept ``(inplanes, planes, stride=...)``.
        num_blocks: sequence with the number of blocks of each of the four stages.
        last_layer_stride: stride of the first block of ``layer4``.
    """

    def __init__(
            self,
            cfg,
            block_type,
            num_blocks,
            last_layer_stride=2,
    ):
        super(ResNet, self).__init__()
        # Channel count fed to the next block; updated by _make_layer.
        self.inplanes = 64
        self.block = block_type
        self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3, bias=False)
        self.bn1 = nn.BatchNorm2d(64)
        self.relu = nn.ReLU(True)
        self.pool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)

        self.layer1 = self._make_layer(num_blocks[0], 64)
        self.layer2 = self._make_layer(num_blocks[1], 128, stride=2)
        self.layer3 = self._make_layer(num_blocks[2], 256, stride=2)
        self.layer4 = self._make_layer(
            num_blocks[3],
            512,
            stride=last_layer_stride,
        )

    def load_model(self, pretrain):
        """Copy matching weights from a checkpoint file into this backbone.

        The checkpoint may be a state dict or a dict holding one under the
        ``"state_dict"`` key. For every entry:

        * a leading ``"module."`` prefix is stripped;
        * entries whose name contains ``"fc"`` or ``"classifier"`` are dropped;
        * every ``"backbone."`` substring is removed from the name;
        * entries with no same-named, same-shaped tensor in this model are
          skipped and reported, so a deeper or shallower checkpoint can still
          be used for the layers that do match.

        Args:
            pretrain: path of the checkpoint file. A leading ``~`` is expanded
                to the user's home directory.
        """
        import os

        print("Loading Backbone pretrain model from {}......".format(pretrain))
        model_dict = self.state_dict()

        # open() does not understand "~", so expand it for path-like inputs.
        source = pretrain
        if isinstance(source, (str, os.PathLike)):
            source = os.path.expanduser(source)
        # NOTE: torch.load unpickles the file; only load checkpoints from a
        # trusted source. map_location keeps GPU-saved files loadable on
        # CPU-only hosts; load_state_dict copies values onto the model's device.
        pretrain_dict = torch.load(source, map_location="cpu")
        if "state_dict" in pretrain_dict:
            pretrain_dict = pretrain_dict["state_dict"]

        prefix = "module."
        new_dict = {}
        skipped = []
        for k, v in pretrain_dict.items():
            if k.startswith(prefix):
                k = k[len(prefix):]
            if "fc" in k or "classifier" in k:
                continue
            k = k.replace("backbone.", "")
            target = model_dict.get(k)
            if target is not None and getattr(v, "shape", None) == target.shape:
                new_dict[k] = v
            else:
                skipped.append(k)

        model_dict.update(new_dict)
        self.load_state_dict(model_dict)
        if skipped:
            print(
                "Skipped {} checkpoint entries without a matching parameter, "
                "e.g. {}".format(len(skipped), skipped[:5])
            )
        print("Backbone model has been loaded......")

    def _make_layer(self, num_block, planes, stride=1):
        """Build one stage; only its first block uses ``stride``."""
        strides = [stride] + [1] * (num_block - 1)
        layers = []
        for now_stride in strides:
            layers.append(self.block(self.inplanes, planes, stride=now_stride))
            # The next block consumes what this one produces.
            self.inplanes = planes * self.block.expansion
        return nn.Sequential(*layers)

    def forward(self, x):
        """Return the ``layer4`` feature map for the input batch ``x``."""
        out = self.conv1(x)
        out = self.bn1(out)
        out = self.relu(out)
        out = self.pool(out)

        out = self.layer1(out)
        out = self.layer2(out)
        out = self.layer3(out)
        out = self.layer4(out)

        return out


class ResNet_2(nn.Module):
    """ResNet variant with a 3x3 stride-1 stem and no max pooling.

    The stem is a 3x3 convolution with batch norm and ReLU. It is followed by
    four stages (``stage2`` .. ``stage5``) with base widths 64, 128, 256 and
    512, each scaled by ``rate`` and truncated to an int. The first stage
    keeps the resolution; each later stage starts with a stride-2 block.

    Args:
        block: block class. It must expose ``expansion`` and accept
            ``(in_channels, out_channels, stride)`` positionally.
        layers: sequence with the number of blocks of each of the four stages.
        rate: multiplier applied to every base width.
        inter_layer: stored on the instance; not read anywhere in this class.
    """

    def __init__(self, block, layers, rate=1, inter_layer=False):
        super(ResNet_2, self).__init__()
        self.inter_layer = inter_layer

        stem_width = int(64 * rate)
        # Channel count fed to the next block; updated by _make_layer.
        self.in_channels = stem_width
        self.conv1 = nn.Sequential(
            nn.Conv2d(3, stem_width, kernel_size=3, padding=1, bias=False),
            nn.BatchNorm2d(stem_width),
            nn.ReLU(inplace=True),
        )

        # (attribute name, base width, stride of the first block)
        stage_plan = (
            ("stage2", 64, 1),
            ("stage3", 128, 2),
            ("stage4", 256, 2),
            ("stage5", 512, 2),
        )
        for idx, (attr, base_width, first_stride) in enumerate(stage_plan):
            stage = self._make_layer(
                block, int(base_width * rate), layers[idx], first_stride
            )
            setattr(self, attr, stage)

    def _make_layer(self, block, out_channels, num_blocks, stride):
        """Build one stage, i.e. a sequence of residual blocks.

        Args:
            block: block class (basic or bottleneck style).
            out_channels: base output width passed to every block of the stage.
            num_blocks: number of blocks in the stage.
            stride: stride of the first block; the remaining blocks use 1.

        Return:
            an ``nn.Sequential`` holding the blocks of the stage.
        """
        stage = nn.Sequential()
        block_strides = (stride,) + (1,) * (num_blocks - 1)
        for position, block_stride in enumerate(block_strides):
            stage.add_module(
                str(position), block(self.in_channels, out_channels, block_stride)
            )
            # The next block consumes what this one produces.
            self.in_channels = out_channels * block.expansion
        return stage

    def forward(self, x):
        """Return the ``stage5`` feature map for the input batch ``x``."""
        for module in (self.conv1, self.stage2, self.stage3, self.stage4, self.stage5):
            x = module(x)
        return x


class BBN_ResNet(nn.Module):
    """ResNet trunk shared by two parallel final blocks.

    The stem and ``layer1`` .. ``layer3`` are built like a plain ResNet.
    ``layer4`` is built with ``num_blocks[3] - 1`` blocks, and its output is
    fed to two separate blocks, ``cb_block`` and ``rb_block``.

    Args:
        cfg: accepted for interface compatibility; this class does not read it.
        block_type: block class to instantiate. It must expose an
            ``expansion`` attribute and accept ``(inplanes, planes, stride=...)``.
        num_blocks: sequence with the number of blocks of each of the four stages.
        last_layer_stride: stride of the first block of ``layer4``.
    """

    def __init__(
            self,
            cfg,
            block_type,
            num_blocks,
            last_layer_stride=2,
    ):
        super(BBN_ResNet, self).__init__()
        # Channel count fed to the next block; updated by _make_layer.
        self.inplanes = 64
        self.block = block_type

        self.conv1 = nn.Conv2d(3, 64, kernel_size=7, stride=2, padding=3, bias=False)
        self.bn1 = nn.BatchNorm2d(64)
        self.relu = nn.ReLU(True)
        self.pool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)

        self.layer1 = self._make_layer(num_blocks[0], 64)
        self.layer2 = self._make_layer(num_blocks[1], 128, stride=2)
        self.layer3 = self._make_layer(num_blocks[2], 256, stride=2)
        # One block fewer than requested: the two branch blocks below take
        # the place of the last block of this stage.
        self.layer4 = self._make_layer(num_blocks[3] - 1, 512, stride=last_layer_stride)

        self.cb_block = self.block(self.inplanes, self.inplanes // 4, stride=1)
        self.rb_block = self.block(self.inplanes, self.inplanes // 4, stride=1)

    def load_model(self, pretrain):
        """Copy matching weights from a checkpoint file into this backbone.

        The checkpoint may be a state dict or a dict holding one under the
        ``"state_dict"`` key. For every entry:

        * a leading ``"module."`` prefix is stripped;
        * entries whose name contains ``"fc"`` or ``"classifier"`` are dropped;
        * every ``"backbone."`` substring is removed from the name;
        * entries with no same-named, same-shaped tensor in this model are
          skipped and reported. Because ``layer4`` is one block shorter than
          requested, a checkpoint of the full-depth network carries such
          entries; ``cb_block`` and ``rb_block`` are only filled when the
          checkpoint has entries under those names.

        Args:
            pretrain: path of the checkpoint file. A leading ``~`` is expanded
                to the user's home directory.
        """
        import os

        print("Loading Backbone pretrain model from {}......".format(pretrain))
        model_dict = self.state_dict()

        # open() does not understand "~", so expand it for path-like inputs.
        source = pretrain
        if isinstance(source, (str, os.PathLike)):
            source = os.path.expanduser(source)
        # NOTE: torch.load unpickles the file; only load checkpoints from a
        # trusted source. map_location keeps GPU-saved files loadable on
        # CPU-only hosts; load_state_dict copies values onto the model's device.
        pretrain_dict = torch.load(source, map_location="cpu")
        if "state_dict" in pretrain_dict:
            pretrain_dict = pretrain_dict["state_dict"]

        prefix = "module."
        new_dict = {}
        skipped = []
        for k, v in pretrain_dict.items():
            if k.startswith(prefix):
                k = k[len(prefix):]
            if "fc" in k or "classifier" in k:
                continue
            k = k.replace("backbone.", "")
            target = model_dict.get(k)
            if target is not None and getattr(v, "shape", None) == target.shape:
                new_dict[k] = v
            else:
                skipped.append(k)

        model_dict.update(new_dict)
        self.load_state_dict(model_dict)
        if skipped:
            print(
                "Skipped {} checkpoint entries without a matching parameter, "
                "e.g. {}".format(len(skipped), skipped[:5])
            )
        print("Backbone model has been loaded......")

    def _make_layer(self, num_block, planes, stride=1):
        """Build one stage; only its first block uses ``stride``."""
        strides = [stride] + [1] * (num_block - 1)
        layers = []
        for now_stride in strides:
            layers.append(self.block(self.inplanes, planes, stride=now_stride))
            # The next block consumes what this one produces.
            self.inplanes = planes * self.block.expansion
        return nn.Sequential(*layers)

    def forward(self, x, **kwargs):
        """Run the shared trunk, then one or both branch blocks.

        Only the presence of a keyword is checked, never its value:

        * ``feature_cb`` given: return the ``cb_block`` output;
        * otherwise ``feature_rb`` given: return the ``rb_block`` output;
        * neither given: return both outputs concatenated along dim 1,
          ``cb_block`` first.
        """
        out = self.conv1(x)
        out = self.bn1(out)
        out = self.relu(out)
        out = self.pool(out)

        out = self.layer1(out)
        out = self.layer2(out)
        out = self.layer3(out)
        out = self.layer4(out)

        if "feature_cb" in kwargs:
            return self.cb_block(out)
        if "feature_rb" in kwargs:
            return self.rb_block(out)

        out1 = self.cb_block(out)
        out2 = self.rb_block(out)
        return torch.cat((out1, out2), dim=1)


def res10(
        cfg,
        pretrain=True,
        pretrained_backbone="~/.cache/torch/checkpoints/resnet18-5c106cde.pth",
        last_layer_stride=2,
):
    """Build a ``ResNet`` with one ``BasicBlock`` in each of its four stages.

    Args:
        cfg: forwarded to ``ResNet``.
        pretrain: when truthy and ``pretrained_backbone`` is not the empty
            string, weights are loaded through ``ResNet.load_model``.
        pretrained_backbone: checkpoint path handed to ``load_model``. The
            default points at a resnet18 checkpoint file.
        last_layer_stride: stride of the first block of the last stage.

    Returns:
        The constructed backbone.
    """
    print("Using ResNet10........")
    blocks_per_stage = [1, 1, 1, 1]
    backbone = ResNet(
        cfg, BasicBlock, blocks_per_stage, last_layer_stride=last_layer_stride
    )

    if not pretrain or pretrained_backbone == "":
        print("Choose to train from scratch")
        return backbone

    backbone.load_model(pretrain=pretrained_backbone)
    return backbone


def res18(
        cfg,
        pretrain=True,
        pretrained_backbone="~/.cache/torch/checkpoints/resnet18-5c106cde.pth",
        last_layer_stride=2,
):
    """Build a ``ResNet`` with two ``BasicBlock`` modules in each of its four stages.

    Args:
        cfg: forwarded to ``ResNet``.
        pretrain: when truthy and ``pretrained_backbone`` is not the empty
            string, weights are loaded through ``ResNet.load_model``.
        pretrained_backbone: checkpoint path handed to ``load_model``.
        last_layer_stride: stride of the first block of the last stage.

    Returns:
        The constructed backbone.
    """
    print("Using ResNet18........")
    blocks_per_stage = [2, 2, 2, 2]
    backbone = ResNet(
        cfg, BasicBlock, blocks_per_stage, last_layer_stride=last_layer_stride
    )

    if not pretrain or pretrained_backbone == "":
        print("Choose to train from scratch")
        return backbone

    backbone.load_model(pretrain=pretrained_backbone)
    return backbone


def res32_512(
        cfg,
        pretrain,
        pretrained_backbone,
        last_layer_stride=2,
):
    """Build a ``ResNet_2`` made of ``BasicBlock`` modules with stage depths 3, 4, 6, 3.

    All four arguments are accepted so the signature lines up with the other
    factories, but none of them is read: no checkpoint is loaded and
    ``ResNet_2`` is created with its default ``rate`` and ``inter_layer``.

    Returns:
        The constructed, randomly initialised backbone.
    """
    print("Using ResNet32, feature dim=512........")
    blocks_per_stage = [3, 4, 6, 3]
    return ResNet_2(BasicBlock, blocks_per_stage)


def res50(
        cfg,
        pretrain=True,
        pretrained_backbone="/data/Data/pretrain_models/resnet50-19c8e357.pth",
        last_layer_stride=2,
):
    """Build a ``ResNet`` of ``BottleNeck`` blocks with stage depths 3, 4, 6, 3.

    Args:
        cfg: forwarded to ``ResNet``.
        pretrain: when truthy and ``pretrained_backbone`` is not the empty
            string, weights are loaded through ``ResNet.load_model``.
        pretrained_backbone: checkpoint path handed to ``load_model``.
        last_layer_stride: stride of the first block of the last stage.

    Returns:
        The constructed backbone.
    """
    print("Using ResNet50........")
    blocks_per_stage = [3, 4, 6, 3]
    backbone = ResNet(
        cfg, BottleNeck, blocks_per_stage, last_layer_stride=last_layer_stride
    )

    if not pretrain or pretrained_backbone == "":
        print("Choose to train from scratch")
        return backbone

    backbone.load_model(pretrain=pretrained_backbone)
    return backbone


def res101(
        cfg,
        pretrain=True,
        pretrained_backbone="/data/Data/pretrain_models/resnet101-5d3b4d8f.pth",
        last_layer_stride=2,
):
    """Build a ``ResNet`` of ``BottleNeck`` blocks with stage depths 3, 4, 23, 3.

    Args:
        cfg: forwarded to ``ResNet``.
        pretrain: when truthy and ``pretrained_backbone`` is not the empty
            string, weights are loaded through ``ResNet.load_model``.
        pretrained_backbone: checkpoint path handed to ``load_model``.
        last_layer_stride: stride of the first block of the last stage.

    Returns:
        The constructed backbone.
    """
    print("Using ResNet101........")
    blocks_per_stage = [3, 4, 23, 3]
    backbone = ResNet(
        cfg, BottleNeck, blocks_per_stage, last_layer_stride=last_layer_stride
    )

    if not pretrain or pretrained_backbone == "":
        print("Choose to train from scratch")
        return backbone

    backbone.load_model(pretrain=pretrained_backbone)
    return backbone


def res152(
        cfg,
        pretrain=True,
        pretrained_backbone="~/.cache/torch/checkpoints/resnet152-b121ed2d.pth",
        last_layer_stride=2,
):
    """Build a ``ResNet`` of ``BottleNeck`` blocks with stage depths 3, 8, 36, 3.

    Args:
        cfg: forwarded to ``ResNet``.
        pretrain: when truthy and ``pretrained_backbone`` is not the empty
            string, weights are loaded through ``ResNet.load_model``.
        pretrained_backbone: checkpoint path handed to ``load_model``.
        last_layer_stride: stride of the first block of the last stage.

    Returns:
        The constructed backbone.
    """
    print("Using ResNet152........")
    blocks_per_stage = [3, 8, 36, 3]
    backbone = ResNet(
        cfg, BottleNeck, blocks_per_stage, last_layer_stride=last_layer_stride
    )

    if not pretrain or pretrained_backbone == "":
        print("Choose to train from scratch")
        return backbone

    backbone.load_model(pretrain=pretrained_backbone)
    return backbone


def bbn_res50(
        cfg,
        pretrain=True,
        pretrained_backbone="/data/Data/pretrain_models/resnet50-19c8e357.pth",
        last_layer_stride=2,
):
    """Build a ``BBN_ResNet`` of ``BottleNeck`` blocks from stage depths 3, 4, 6, 3.

    Args:
        cfg: forwarded to ``BBN_ResNet``.
        pretrain: when truthy and ``pretrained_backbone`` is not the empty
            string, weights are loaded through ``BBN_ResNet.load_model``.
        pretrained_backbone: checkpoint path handed to ``load_model``.
        last_layer_stride: stride of the first block of the last stage.

    Returns:
        The constructed backbone.
    """
    print("Using BBN_ResNet50........")
    blocks_per_stage = [3, 4, 6, 3]
    backbone = BBN_ResNet(
        cfg, BottleNeck, blocks_per_stage, last_layer_stride=last_layer_stride
    )

    if not pretrain or pretrained_backbone == "":
        print("Choose to train from scratch")
        return backbone

    backbone.load_model(pretrain=pretrained_backbone)
    return backbone
