cvm/models/resnet.py

"""Contains definitions for post- and pre-activation forms of ResNet and ResNet-RS models.
Residual networks (ResNets) were proposed in:
[1] Kaiming He, Xiangyu Zhang, Shaoqing Ren, Jian Sun
    Deep Residual Learning for Image Recognition. arXiv:1512.03385
[2] Kaiming He, Xiangyu Zhang, Shaoqing Ren, Jian Sun
    Identity Mappings in Deep Residual Networks. arXiv:1603.05027
[3] Irwan Bello, William Fedus, Xianzhi Du, Ekin D. Cubuk, Aravind Srinivas,
Tsung-Yi Lin, Jonathon Shlens, Barret Zoph
    Revisiting ResNets: Improved Training and Scaling Strategies.
    arXiv:2103.07579
"""
import torch
import torch.nn as nn

from .ops import blocks
from .utils import export, load_from_local_or_url, config
from typing import Any, List, OrderedDict


@export
class ResNet(nn.Module):
    def __init__(
        self,
        in_channels: int = 3,
        num_classes: int = 1000,
        layers: List[int] = [2, 2, 2, 2],
        groups: int = 1,
        width_per_group: int = 64,
        rd_ratio: float = None,
        dropout_rate: float = 0.0,
        drop_path_rate: float = None,
        block: nn.Module = blocks.ResBasicBlockV1,
        thumbnail: bool = False,
        replace_stem_max_pool: bool = False,
        use_resnetc_stem: bool = False,
        use_resnetd_shortcut: bool = False,
        zero_init_last_bn: bool = True,
        dilations: List[int] = None,
        **kwargs: Any
    ):
        super().__init__()

        if dilations is None:
            dilations = [1, 1, 1, 1]
        assert len(dilations) >= 4, ''

        FRONT_S = 1 if thumbnail else 2

        self.layers = layers
        self.groups = groups
        self.width_per_group = width_per_group
        self.block = block
        self.ratio = rd_ratio
        self.drop_path_rate = drop_path_rate
        self.use_resnetd_shortcut = use_resnetd_shortcut
        self.version = 1
        if issubclass(block, (blocks.ResBasicBlockV2, blocks.BottleneckV2)):
            self.version = 2

        if use_resnetc_stem:
            stem = blocks.Stage(
                blocks.Conv2d3x3(in_channels, 64, stride=FRONT_S),
                *blocks.norm_activation(64),
                blocks.Conv2d3x3(64, 64),
                *blocks.norm_activation(64),
                blocks.Conv2d3x3(64, 64)
            )
        else:
            stem = blocks.Stage(
                nn.Conv2d(in_channels, 64, 7, FRONT_S, padding=3, bias=False)
            )

        if self.version == 1 or replace_stem_max_pool:
            stem.append(blocks.norm_activation(64))

        stage1 = blocks.Stage()
        if replace_stem_max_pool:
            stage1.append(blocks.Conv2d3x3(64, 64, stride=FRONT_S))
            if self.version == 1:
                stage1.append(blocks.norm_activation(64))
        elif not thumbnail:
            stage1.append(nn.MaxPool2d(3, stride=2, padding=1))

        stage1.append(self.make_layers(64 // block.expansion, 64, 1, layers[0], 2, dilations[0]))

        self.features = nn.Sequential(OrderedDict([
            ('stem', stem),
            ('stage1', stage1),
            ('stage2', blocks.Stage(self.make_layers(64, 128, 2, layers[1], 3, dilations[1]))),
            ('stage3', blocks.Stage(self.make_layers(128, 256, 2, layers[2], 4, dilations[2]))),
            ('stage4', blocks.Stage(self.make_layers(256, 512, 2, layers[3], 5, dilations[3]))),
        ]))
        
        if self.version == 2:
            self.features[-1].append(blocks.norm_activation(512 * self.block.expansion))
            
        self.pool = nn.AdaptiveAvgPool2d((1, 1))
        self.classifier = nn.Sequential(
            nn.Dropout(dropout_rate, inplace=True),
            nn.Linear(512 * block.expansion, num_classes)
        )

        self.reset_parameters(zero_init_last_bn=zero_init_last_bn)

    def reset_parameters(self, zero_init_last_bn: bool = True) -> None:
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')
                if m.bias is not None:
                    nn.init.zeros_(m.bias)
            elif isinstance(m, nn.BatchNorm2d):
                nn.init.ones_(m.weight)
                nn.init.zeros_(m.bias)

        # Zero-initialize the last BN in each residual branch,
        # so that the residual branch starts with zeros, and each residual block behaves like an identity.
        # This improves the model by 0.2~0.3% according to https://arxiv.org/abs/1706.02677
        if zero_init_last_bn:
            for m in self.modules():
                if hasattr(m, 'zero_init_last_bn'):
                    m.zero_init_last_bn()

    def forward(self, x):
        x = self.features(x)
        x = self.pool(x)
        x = torch.flatten(x, 1)
        x = self.classifier(x)
        return x

    def get_drop_path_rate(self, block_num: int):
        if self.drop_path_rate is not None:
            return self.drop_path_rate * float(block_num) / (len(self.layers) + 1)
        else:
            return None

    def make_layers(self, inp, oup, stride, n, block_num, dilation):
        layers = []
        inp = inp * self.block.expansion
        for _ in range(n):
            layers.append(
                self.block(
                    inp,
                    oup,
                    stride=stride if dilation == 1 else 1,
                    groups=self.groups,
                    width_per_group=self.width_per_group,
                    rd_ratio=self.ratio,
                    drop_path_rate=self.get_drop_path_rate(block_num),
                    use_resnetd_shortcut=self.use_resnetd_shortcut,
                    dilation=max(1, (dilation//stride))
                )
            )
            inp = oup * self.block.expansion
            stride = 1
        return layers


def _resnet(
    layers: List[int],
    block: nn.Module,
    rd_ratio: float = None,
    pretrained: bool = False,
    pth: str = None,
    progress: bool = False,
    **kwargs: Any
):
    model = ResNet(layers=layers, block=block, rd_ratio=rd_ratio, **kwargs)

    if pretrained:
        load_from_local_or_url(model, pth, kwargs.get('url', None), progress)
    return model


@export
@config(url='https://github.com/ffiirree/cv-models/releases/download/v0.0.2-resnets/resnet18_v1-9f8d6382.pth')
def resnet18_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([2, 2, 2, 2], blocks.ResBasicBlockV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet34_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.ResBasicBlockV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet50_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet101_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 23, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet152_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 8, 36, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet18_v1d(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    return _resnet([2, 2, 2, 2], blocks.ResBasicBlockV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet34_v1d(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    return _resnet([3, 4, 6, 3], blocks.ResBasicBlockV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet50_v1d(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    return _resnet([3, 4, 6, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet101_v1d(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    return _resnet([3, 4, 23, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet152_v1d(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    return _resnet([3, 8, 36, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet18_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([2, 2, 2, 2], blocks.ResBasicBlockV2, None, pretrained, pth, progress, **kwargs)


@export
def resnet34_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.ResBasicBlockV2, None, pretrained, pth, progress, **kwargs)


@export
def resnet50_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.BottleneckV2, None, pretrained, pth, progress, **kwargs)


@export
def resnet101_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 23, 3], blocks.BottleneckV2, None, pretrained, pth, progress, **kwargs)


@export
def resnet152_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 8, 36, 3], blocks.BottleneckV2, None, pretrained, pth, progress, **kwargs)


@export
def se_resnet18_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([2, 2, 2, 2], blocks.ResBasicBlockV1, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet34_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.ResBasicBlockV1, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet50_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.BottleneckV1, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet101_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 23, 3], blocks.BottleneckV1, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet152_v1(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 8, 36, 3], blocks.BottleneckV1, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet18_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([2, 2, 2, 2], blocks.ResBasicBlockV2, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet34_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.ResBasicBlockV2, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet50_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 6, 3], blocks.BottleneckV2, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet101_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 4, 23, 3], blocks.BottleneckV2, 1/16, pretrained, pth, progress, **kwargs)


@export
def se_resnet152_v2(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    return _resnet([3, 8, 36, 3], blocks.BottleneckV2, 1/16, pretrained, pth, progress, **kwargs)


@export
def resnext50_32x4d(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['groups'] = 32
    kwargs['width_per_group'] = 4
    return _resnet([3, 4, 6, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnext101_32x8d(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['groups'] = 32
    kwargs['width_per_group'] = 8
    return _resnet([3, 4, 23, 3], blocks.BottleneckV1, None, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_50(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['dropout_rate'] = 0.25
    return _resnet([3, 4, 6, 3], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_101(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['dropout_rate'] = 0.25
    return _resnet([3, 4, 23, 3], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_152(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['dropout_rate'] = 0.25
    return _resnet([3, 8, 36, 3], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_200(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['drop_path_rate'] = 0.1
    kwargs['dropout_rate'] = 0.25
    return _resnet([3, 24, 36, 3], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_270(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['drop_path_rate'] = 0.1
    kwargs['dropout_rate'] = 0.25
    return _resnet([4, 29, 53, 4], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_350_i256(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['drop_path_rate'] = 0.1
    kwargs['dropout_rate'] = 0.25
    return _resnet([4, 4, 72, 4], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_350_i320(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['drop_path_rate'] = 0.1
    kwargs['dropout_rate'] = 0.4
    return _resnet([4, 4, 72, 4], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)


@export
def resnet_rs_420(pretrained: bool = False, pth: str = None, progress: bool = True, **kwargs: Any):
    kwargs['replace_stem_max_pool'] = True
    kwargs['use_resnetc_stem'] = True
    kwargs['use_resnetd_shortcut'] = True
    kwargs['drop_path_rate'] = 0.1
    kwargs['dropout_rate'] = 0.4
    return _resnet([4, 4, 87, 4], blocks.BottleneckV1, 0.25, pretrained, pth, progress, **kwargs)