Source code for machin.model.nets.resnet

import torch as t
import numpy as np
import torch.nn as nn
from torch.nn.utils.weight_norm import weight_norm

from .base import NeuralNetworkModule


def conv1x1(in_planes, out_planes, stride=1):
    """
    Create a 1x1 2d convolution block
    """
    return nn.Conv2d(in_planes, out_planes, kernel_size=1, stride=stride, bias=False)


def conv3x3(in_planes, out_planes, stride=1):
    """
    Create a 3x3 2d convolution block
    """
    return nn.Conv2d(
        in_planes, out_planes, kernel_size=3, stride=stride, padding=1, bias=False
    )


def conv5x5(in_planes, out_planes, stride=2):
    """
    Create a 5x5 2d convolution block
    """
    return nn.Conv2d(
        in_planes, out_planes, kernel_size=5, stride=stride, padding=2, bias=False
    )
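
# Example (a sketch, not part of machin's API): shape behavior of the three
# helpers above, reusing the module-level ``torch as t`` import. With their
# default strides, conv1x1 and conv3x3 preserve the spatial size, while
# conv5x5 (default stride 2) halves it.
def _demo_conv_helpers():
    x = t.randn(1, 16, 32, 32)
    assert conv1x1(16, 32)(x).shape == (1, 32, 32, 32)
    assert conv3x3(16, 32)(x).shape == (1, 32, 32, 32)
    assert conv5x5(16, 32)(x).shape == (1, 32, 16, 16)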


def none_norm(*_, **__):
    """
    A drop-in replacement for a normalization layer constructor that applies
    no normalization (an empty ``nn.Sequential`` acts as an identity).
    """
    return nn.Sequential()


def cfg(depth, norm="none"):
    depth_lst = [18, 34, 50, 101, 152]
    if depth not in depth_lst:
        raise ValueError(
            "Error : Resnet depth should be either " "18, 34, 50, 101, 152"
        )
    if norm == "batch":
        cfg_dict = {
            "18": (BasicBlock, [2, 2, 2, 2], {}),
            "34": (BasicBlock, [3, 4, 6, 3], {}),
            "50": (Bottleneck, [3, 4, 6, 3], {}),
            "101": (Bottleneck, [3, 4, 23, 3], {}),
            "152": (Bottleneck, [3, 8, 36, 3], {}),
        }
    elif norm == "weight":
        cfg_dict = {
            "18": (BasicBlockWN, [2, 2, 2, 2], {}),
            "34": (BasicBlockWN, [3, 4, 6, 3], {}),
            "50": (BottleneckWN, [3, 4, 6, 3], {}),
            "101": (BottleneckWN, [3, 4, 23, 3], {}),
            "152": (BottleneckWN, [3, 8, 36, 3], {}),
        }
    elif norm == "none":
        cfg_dict = {
            "18": (BasicBlock, [2, 2, 2, 2], {"norm_layer": none_norm}),
            "34": (BasicBlock, [3, 4, 6, 3], {"norm_layer": none_norm}),
            "50": (Bottleneck, [3, 4, 6, 3], {"norm_layer": none_norm}),
            "101": (Bottleneck, [3, 4, 23, 3], {"norm_layer": none_norm}),
            "152": (Bottleneck, [3, 8, 36, 3], {"norm_layer": none_norm}),
        }
    else:
        raise ValueError(f'Invalid normalization method: "{norm}"')
    return cfg_dict[str(depth)]
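
# Example (a sketch, not part of machin's API): how ``cfg`` resolves a depth
# and normalization method into a (block class, blocks per stage, extra
# kwargs) triple. The block classes are looked up at call time, so they may
# be defined below.
def _demo_cfg():
    block, num_blocks, kw = cfg(50, norm="batch")
    assert block is Bottleneck and num_blocks == [3, 4, 6, 3] and kw == {}
    block, num_blocks, kw = cfg(18)  # norm defaults to "none"
    assert block is BasicBlock and kw == {"norm_layer": none_norm}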


class BasicBlock(NeuralNetworkModule):
    # Expansion parameter, output will have "expansion * out_planes" depth.
    expansion = 1

    def __init__(self, in_planes, out_planes, stride=1, norm_layer=None, **__):
        """
        Create a basic block of resnet.

        Args:
            in_planes:  Number of input planes.
            out_planes: Number of output planes.
            stride:     Stride of convolution.
            norm_layer: Normalization layer constructor; defaults to
                        ``nn.BatchNorm2d`` when ``None``.
        """
        if norm_layer is None:
            norm_layer = nn.BatchNorm2d
        super().__init__()
        self.conv1 = conv3x3(in_planes, out_planes, stride)
        self.bn1 = norm_layer(out_planes)
        self.conv2 = conv3x3(out_planes, self.expansion * out_planes)
        self.bn2 = norm_layer(self.expansion * out_planes)
        # Create a shortcut from input to output.
        # An empty sequential structure means no transformation
        # is made on input X.
        self.shortcut = nn.Sequential()

        self.set_input_module(self.conv1)

        # A 1x1 convolution (plus normalization) is needed if we cannot
        # directly add input X to the output.
        if stride != 1 or in_planes != self.expansion * out_planes:
            self.shortcut = nn.Sequential(
                conv1x1(in_planes, self.expansion * out_planes, stride),
                norm_layer(self.expansion * out_planes),
            )

    def forward(self, x):
        out = t.relu(self.bn1(self.conv1(x)))
        out = self.bn2(self.conv2(out))
        out += self.shortcut(x)
        out = t.relu(out)
        return out
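
# Example (a sketch, not part of machin's API; assumes machin's
# NeuralNetworkModule base imported above is available): a BasicBlock keeps
# the spatial size when stride is 1 and in_planes == expansion * out_planes
# (identity shortcut); otherwise the 1x1 shortcut matches the output shape.
def _demo_basic_block():
    x = t.randn(4, 64, 56, 56)
    assert BasicBlock(64, 64)(x).shape == (4, 64, 56, 56)
    assert BasicBlock(64, 128, stride=2)(x).shape == (4, 128, 28, 28)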


class Bottleneck(NeuralNetworkModule):
    # Expansion parameter, output will have "expansion * out_planes" depth.
    expansion = 4

    def __init__(self, in_planes, out_planes, stride=1, norm_layer=None, **__):
        """
        Create a bottleneck block of resnet.

        Args:
            in_planes:  Number of input planes.
            out_planes: Number of output planes.
            stride:     Stride of convolution.
            norm_layer: Normalization layer constructor; defaults to
                        ``nn.BatchNorm2d`` when ``None``.
        """
        if norm_layer is None:
            norm_layer = nn.BatchNorm2d
        super().__init__()
        self.conv1 = conv1x1(in_planes, out_planes)
        self.conv2 = conv3x3(out_planes, out_planes, stride=stride)
        self.conv3 = conv1x1(out_planes, self.expansion * out_planes)
        self.bn1 = norm_layer(out_planes)
        self.bn2 = norm_layer(out_planes)
        self.bn3 = norm_layer(self.expansion * out_planes)

        self.shortcut = nn.Sequential()

        self.set_input_module(self.conv1)

        if stride != 1 or in_planes != self.expansion * out_planes:
            self.shortcut = nn.Sequential(
                conv1x1(in_planes, self.expansion * out_planes, stride),
                norm_layer(self.expansion * out_planes),
            )

    def forward(self, x):
        out = t.relu(self.bn1(self.conv1(x)))
        out = t.relu(self.bn2(self.conv2(out)))
        out = self.bn3(self.conv3(out))
        out += self.shortcut(x)
        out = t.relu(out)
        return out
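
# Example (a sketch, not part of machin's API): a Bottleneck expands the
# channel count by ``expansion`` (4), so even with stride 1 a 64 -> 64 block
# needs the 1x1 shortcut and outputs 256 channels.
def _demo_bottleneck():
    x = t.randn(4, 64, 56, 56)
    assert Bottleneck(64, 64)(x).shape == (4, 256, 56, 56)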


class BasicBlockWN(NeuralNetworkModule):
    """
    Basic block with weight normalization
    """

    # Expansion parameter, output will have "expansion * out_planes" depth.
    expansion = 1

    def __init__(self, in_planes, out_planes, stride=1, **__):
        """
        Create a basic block of resnet with weight normalization.

        Args:
            in_planes:  Number of input planes.
            out_planes: Number of output planes.
            stride:     Stride of convolution.
        """
        super().__init__()
        self.conv1 = weight_norm(conv3x3(in_planes, out_planes, stride))
        self.conv2 = weight_norm(conv3x3(out_planes, self.expansion * out_planes))
        # Create a shortcut from input to output.
        # An empty sequential structure means no transformation
        # is made on input X.
        self.shortcut = nn.Sequential()

        self.set_input_module(self.conv1)

        # A convolution is needed if we cannot directly add input X to output.
        if stride != 1 or in_planes != self.expansion * out_planes:
            self.shortcut = nn.Sequential(
                weight_norm(conv1x1(in_planes, self.expansion * out_planes, stride)),
            )

    def forward(self, x):
        out = t.relu(self.conv1(x))
        out = self.conv2(out)
        out += self.shortcut(x)
        out = t.relu(out)
        return out
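
# Example (a sketch, not part of machin's API): ``weight_norm`` reparameterizes
# each convolution's ``weight`` into a magnitude ``weight_g`` and a direction
# ``weight_v``, which is why these blocks need no separate norm layers.
def _demo_weight_norm():
    block = BasicBlockWN(64, 64)
    names = {name for name, _ in block.conv1.named_parameters()}
    assert names == {"weight_g", "weight_v"}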


class BottleneckWN(NeuralNetworkModule):
    """
    Bottleneck block with weight normalization
    """

    # Expansion parameter, output will have "expansion * out_planes" depth.
    expansion = 4

    def __init__(self, in_planes, out_planes, stride=1, **__):
        """
        Create a bottleneck block of resnet with weight normalization.

        Args:
            in_planes:  Number of input planes.
            out_planes: Number of output planes.
            stride:     Stride of convolution.
        """
        super().__init__()
        self.conv1 = weight_norm(conv1x1(in_planes, out_planes))
        self.conv2 = weight_norm(conv3x3(out_planes, out_planes, stride=stride))
        self.conv3 = weight_norm(conv1x1(out_planes, self.expansion * out_planes))

        self.shortcut = nn.Sequential()

        self.set_input_module(self.conv1)

        if stride != 1 or in_planes != self.expansion * out_planes:
            self.shortcut = nn.Sequential(
                weight_norm(conv1x1(in_planes, self.expansion * out_planes, stride)),
            )

    def forward(self, x):
        out = t.relu(self.conv1(x))
        out = t.relu(self.conv2(out))
        out = self.conv3(out)
        out += self.shortcut(x)
        out = t.relu(out)
        return out


class ResNet(NeuralNetworkModule):
    def __init__(
        self,
        in_planes: int,
        depth: int,
        out_planes: int,
        out_pool_size=(1, 1),
        norm="none",
    ):
        """
        Create a resnet of specified depth.

        Args:
            in_planes:     Number of input planes.
            depth:         Depth of resnet. Could be one of
                           ``18, 34, 50, 101, 152``.
            out_planes:    Number of output planes.
            out_pool_size: Size of pooling output.
            norm:          Normalization method, could be one of
                           "none", "batch" or "weight".
        """
        super().__init__()
        self.norm = norm
        self.depth = depth
        self.in_planes = in_planes
        self.out_planes = out_planes
        self.out_pool_size = out_pool_size
        self._cur_in_planes = 64

        block, num_blocks, kw = cfg(depth, norm)
        self.conv1 = nn.Conv2d(
            in_planes, 64, kernel_size=7, stride=2, padding=3, bias=False
        )
        self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)
        self.layer1 = self._make_layer(block, 64, num_blocks[0], 1, kw)
        self.layer2 = self._make_layer(block, 128, num_blocks[1], 2, kw)
        self.layer3 = self._make_layer(block, 256, num_blocks[2], 2, kw)
        self.layer4 = self._make_layer(block, 512, num_blocks[3], 2, kw)
        if norm == "batch":
            self.bn1 = nn.BatchNorm2d(64)
            self.base = nn.Sequential(
                self.conv1,
                self.bn1,
                nn.ReLU(),
                self.maxpool,
                self.layer1,
                self.layer2,
                self.layer3,
                self.layer4,
            )
        else:
            self.base = nn.Sequential(
                self.conv1,
                nn.ReLU(),
                self.maxpool,
                self.layer1,
                self.layer2,
                self.layer3,
                self.layer4,
            )
        # layer4 outputs "512 * block.expansion" planes, so the fully
        # connected layer must take the block expansion into account
        # (a hard-coded 512 would break the Bottleneck variants).
        self.fc = nn.Linear(
            512 * block.expansion * out_pool_size[0] * out_pool_size[1],
            out_planes,
        )
        self.set_input_module(self.conv1)

    def _make_layer(self, block, planes, num_blocks, stride, kwargs):
        # The first block of each layer may downsample with ``stride``,
        # all remaining blocks use stride 1.
        strides = [stride] + [1] * (num_blocks - 1)
        layers = []
        for stride in strides:
            layers.append(block(self._cur_in_planes, planes, stride, **kwargs))
            self._cur_in_planes = planes * block.expansion
        return nn.Sequential(*layers)
    def forward(self, x):
        # The stem and the four downsampling stages assume a 224 x 224 input.
        assert x.shape[2] == 224 and x.shape[3] == 224
        x = self.base(x)
        # Choose the pooling kernel so that the pooled feature map has
        # spatial size ``out_pool_size``.
        kernel_size = (
            int(np.floor(x.size(2) / self.out_pool_size[0])),
            int(np.floor(x.size(3) / self.out_pool_size[1])),
        )
        x = nn.functional.avg_pool2d(x, kernel_size)
        x = x.view(x.size(0), -1)
        x = self.fc(x)
        return x
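
# Example usage (a sketch, not part of machin's API): a depth-18 resnet over
# RGB inputs; ``forward`` asserts a 224 x 224 input, and with the default
# ``out_pool_size`` of (1, 1) the head sees 512 * expansion features.
def _demo_resnet():
    net = ResNet(in_planes=3, depth=18, out_planes=10)
    x = t.randn(2, 3, 224, 224)
    assert net(x).shape == (2, 10)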