d8/ddf/osnet_8py_source.html

# encoding: utf-8

"""

@author:  xingyu liao

@contact: sherlockliao01@gmail.com

"""


# based on:

# https://github.com/KaiyangZhou/deep-person-reid/blob/master/torchreid/models/osnet.py


import logging


import torch

from torch import nn


from fastreid.layers import get_norm

from fastreid.utils import comm

from .build import BACKBONE_REGISTRY


logger = logging.getLogger(__name__)

model_urls = {

    'osnet_x1_0':

        'https://drive.google.com/uc?id=1LaG1EJpHrxdAxKnSCJ_i0u-nbxSAeiFY',

    'osnet_x0_75':

        'https://drive.google.com/uc?id=1uwA9fElHOk3ZogwbeY5GkLI6QPTX70Hq',

    'osnet_x0_5':

        'https://drive.google.com/uc?id=16DGLbZukvVYgINws8u8deSaOqjybZ83i',

    'osnet_x0_25':

        'https://drive.google.com/uc?id=1rb8UN5ZzPKRc_xvtHlyDh-cSz88YX9hs',

    'osnet_ibn_x1_0':

        'https://drive.google.com/uc?id=1sr90V6irlYYDd4_4ISU2iruoRG8J__6l'

}


class ConvLayer(nn.Module):

    """Convolution layer (conv + bn + relu)."""


    def __init__(

            self,

            in_channels,

            out_channels,

            kernel_size,

            bn_norm,

            stride=1,

            padding=0,

            groups=1,

            IN=False

    ):

        super(ConvLayer, self).__init__()

        self.conv = nn.Conv2d(

            in_channels,

            out_channels,

            kernel_size,

            stride=stride,

            padding=padding,

            bias=False,

            groups=groups

        )

        if IN:

            self.bn = nn.InstanceNorm2d(out_channels, affine=True)

        else:

            self.bn = get_norm(bn_norm, out_channels)

        self.relu = nn.ReLU(inplace=True)


    def forward(self, x):

        x = self.conv(x)

        x = self.bn(x)

        x = self.relu(x)

        return x


class Conv1x1(nn.Module):

    """1x1 convolution + bn + relu."""


    def __init__(self, in_channels, out_channels, bn_norm, stride=1, groups=1):

        super(Conv1x1, self).__init__()

        self.conv = nn.Conv2d(

            in_channels,

            out_channels,

            1,

            stride=stride,

            padding=0,

            bias=False,

            groups=groups

        )

        self.bn = get_norm(bn_norm, out_channels)

        self.relu = nn.ReLU(inplace=True)


    def forward(self, x):

        x = self.conv(x)

        x = self.bn(x)

        x = self.relu(x)

        return x


class Conv1x1Linear(nn.Module):

    """1x1 convolution + bn (w/o non-linearity)."""


    def __init__(self, in_channels, out_channels, bn_norm, stride=1):

        super(Conv1x1Linear, self).__init__()

        self.conv = nn.Conv2d(

            in_channels, out_channels, 1, stride=stride, padding=0, bias=False

        )

        self.bn = get_norm(bn_norm, out_channels)


    def forward(self, x):

        x = self.conv(x)

        x = self.bn(x)

        return x


class Conv3x3(nn.Module):

    """3x3 convolution + bn + relu."""


    def __init__(self, in_channels, out_channels, bn_norm, stride=1, groups=1):

        super(Conv3x3, self).__init__()

        self.conv = nn.Conv2d(

            in_channels,

            out_channels,

            3,

            stride=stride,

            padding=1,

            bias=False,

            groups=groups

        )

        self.bn = get_norm(bn_norm, out_channels)

        self.relu = nn.ReLU(inplace=True)


    def forward(self, x):

        x = self.conv(x)

        x = self.bn(x)

        x = self.relu(x)

        return x


class LightConv3x3(nn.Module):

    """Lightweight 3x3 convolution.

    1x1 (linear) + dw 3x3 (nonlinear).

    """


    def __init__(self, in_channels, out_channels, bn_norm):

        super(LightConv3x3, self).__init__()

        self.conv1 = nn.Conv2d(

            in_channels, out_channels, 1, stride=1, padding=0, bias=False

        )

        self.conv2 = nn.Conv2d(

            out_channels,

            out_channels,

            3,

            stride=1,

            padding=1,

            bias=False,

            groups=out_channels

        )

        self.bn = get_norm(bn_norm, out_channels)

        self.relu = nn.ReLU(inplace=True)


    def forward(self, x):

        x = self.conv1(x)

        x = self.conv2(x)

        x = self.bn(x)

        x = self.relu(x)

        return x


class ChannelGate(nn.Module):

    """A mini-network that generates channel-wise gates conditioned on input tensor."""


    def __init__(

            self,

            in_channels,

            num_gates=None,

            return_gates=False,

            gate_activation='sigmoid',

            reduction=16,

            layer_norm=False

    ):

        super(ChannelGate, self).__init__()

        if num_gates is None: num_gates = in_channels

        self.return_gates = return_gates


        self.global_avgpool = nn.AdaptiveAvgPool2d(1)


        self.fc1 = nn.Conv2d(

            in_channels,

            in_channels // reduction,

            kernel_size=1,

            bias=True,

            padding=0

        )

        self.norm1 = None

        if layer_norm: self.norm1 = nn.LayerNorm((in_channels // reduction, 1, 1))

        self.relu = nn.ReLU(inplace=True)

        self.fc2 = nn.Conv2d(

            in_channels // reduction,

            num_gates,

            kernel_size=1,

            bias=True,

            padding=0

        )

        if gate_activation == 'sigmoid':

            self.gate_activation = nn.Sigmoid()

        elif gate_activation == 'relu':

            self.gate_activation = nn.ReLU(inplace=True)

        elif gate_activation == 'linear':

            self.gate_activation = nn.Identity()

        else:

            raise RuntimeError(

                "Unknown gate activation: {}".format(gate_activation)

            )


    def forward(self, x):

        input = x

        x = self.global_avgpool(x)

        x = self.fc1(x)

        if self.norm1 is not None: x = self.norm1(x)

        x = self.relu(x)

        x = self.fc2(x)

        x = self.gate_activation(x)

        if self.return_gates: return x

        return input * x


class OSBlock(nn.Module):

    """Omni-scale feature learning block."""


    def __init__(

            self,

            in_channels,

            out_channels,

            bn_norm,

            IN=False,

            bottleneck_reduction=4,

            **kwargs

    ):

        super(OSBlock, self).__init__()

        mid_channels = out_channels // bottleneck_reduction

        self.conv1 = Conv1x1(in_channels, mid_channels, bn_norm)

        self.conv2a = LightConv3x3(mid_channels, mid_channels, bn_norm)

        self.conv2b = nn.Sequential(

            LightConv3x3(mid_channels, mid_channels, bn_norm),

            LightConv3x3(mid_channels, mid_channels, bn_norm),

        )

        self.conv2c = nn.Sequential(

            LightConv3x3(mid_channels, mid_channels, bn_norm),

            LightConv3x3(mid_channels, mid_channels, bn_norm),

            LightConv3x3(mid_channels, mid_channels, bn_norm),

        )

        self.conv2d = nn.Sequential(

            LightConv3x3(mid_channels, mid_channels, bn_norm),

            LightConv3x3(mid_channels, mid_channels, bn_norm),

            LightConv3x3(mid_channels, mid_channels, bn_norm),

            LightConv3x3(mid_channels, mid_channels, bn_norm),

        )

        self.gate = ChannelGate(mid_channels)

        self.conv3 = Conv1x1Linear(mid_channels, out_channels, bn_norm)

        self.downsample = None

        if in_channels != out_channels:

            self.downsample = Conv1x1Linear(in_channels, out_channels, bn_norm)

        self.IN = None

        if IN: self.IN = nn.InstanceNorm2d(out_channels, affine=True)

        self.relu = nn.ReLU(True)


    def forward(self, x):

        identity = x

        x1 = self.conv1(x)

        x2a = self.conv2a(x1)

        x2b = self.conv2b(x1)

        x2c = self.conv2c(x1)

        x2d = self.conv2d(x1)

        x2 = self.gate(x2a) + self.gate(x2b) + self.gate(x2c) + self.gate(x2d)

        x3 = self.conv3(x2)

        if self.downsample is not None:

            identity = self.downsample(identity)

        out = x3 + identity

        if self.IN is not None:

            out = self.IN(out)

        return self.relu(out)


class OSNet(nn.Module):

    """Omni-Scale Network.


    Reference:

        - Zhou et al. Omni-Scale Feature Learning for Person Re-Identification. ICCV, 2019.

        - Zhou et al. Learning Generalisable Omni-Scale Representations

          for Person Re-Identification. arXiv preprint, 2019.

    """


    def __init__(

            self,

            blocks,

            layers,

            channels,

            bn_norm,

            IN=False,

            **kwargs

    ):

        super(OSNet, self).__init__()

        num_blocks = len(blocks)

        assert num_blocks == len(layers)

        assert num_blocks == len(channels) - 1


        # convolutional backbone

        self.conv1 = ConvLayer(3, channels[0], 7, bn_norm, stride=2, padding=3, IN=IN)

        self.maxpool = nn.MaxPool2d(3, stride=2, padding=1)

        self.conv2 = self._make_layer(

            blocks[0],

            layers[0],

            channels[0],

            channels[1],

            bn_norm,

            reduce_spatial_size=True,

            IN=IN

        )

        self.conv3 = self._make_layer(

            blocks[1],

            layers[1],

            channels[1],

            channels[2],

            bn_norm,

            reduce_spatial_size=True

        )

        self.conv4 = self._make_layer(

            blocks[2],

            layers[2],

            channels[2],

            channels[3],

            bn_norm,

            reduce_spatial_size=False

        )

        self.conv5 = Conv1x1(channels[3], channels[3], bn_norm)


        self._init_params()


    def _make_layer(

            self,

            block,

            layer,

            in_channels,

            out_channels,

            bn_norm,

            reduce_spatial_size,

            IN=False

    ):

        layers = []


        layers.append(block(in_channels, out_channels, bn_norm, IN=IN))

        for i in range(1, layer):

            layers.append(block(out_channels, out_channels, bn_norm, IN=IN))


        if reduce_spatial_size:

            layers.append(

                nn.Sequential(

                    Conv1x1(out_channels, out_channels, bn_norm),

                    nn.AvgPool2d(2, stride=2),

                )

            )


        return nn.Sequential(*layers)


    def _init_params(self):

        for m in self.modules():

            if isinstance(m, nn.Conv2d):

                nn.init.kaiming_normal_(

                    m.weight, mode='fan_out', nonlinearity='relu'

                )

                if m.bias is not None:

                    nn.init.constant_(m.bias, 0)


            elif isinstance(m, nn.BatchNorm2d):

                nn.init.constant_(m.weight, 1)

                nn.init.constant_(m.bias, 0)


            elif isinstance(m, nn.BatchNorm1d):

                nn.init.constant_(m.weight, 1)

                nn.init.constant_(m.bias, 0)


            elif isinstance(m, nn.Linear):

                nn.init.normal_(m.weight, 0, 0.01)

                if m.bias is not None:

                    nn.init.constant_(m.bias, 0)


    def forward(self, x):

        x = self.conv1(x)

        x = self.maxpool(x)

        x = self.conv2(x)

        x = self.conv3(x)

        x = self.conv4(x)

        x = self.conv5(x)

        return x


def init_pretrained_weights(model, key=''):

    """Initializes model with pretrained weights.


    Layers that don't match with pretrained layers in name or size are kept unchanged.

    """

    import os

    import errno

    import gdown

    from collections import OrderedDict

    import warnings

    import logging


    logger = logging.getLogger(__name__)


    def _get_torch_home():

        ENV_TORCH_HOME = 'TORCH_HOME'

        ENV_XDG_CACHE_HOME = 'XDG_CACHE_HOME'

        DEFAULT_CACHE_DIR = '~/.cache'

        torch_home = os.path.expanduser(

            os.getenv(

                ENV_TORCH_HOME,

                os.path.join(

                    os.getenv(ENV_XDG_CACHE_HOME, DEFAULT_CACHE_DIR), 'torch'

                )

            )

        )

        return torch_home


    torch_home = _get_torch_home()

    model_dir = os.path.join(torch_home, 'checkpoints')

    try:

        os.makedirs(model_dir)

    except OSError as e:

        if e.errno == errno.EEXIST:

            # Directory already exists, ignore.

            pass

        else:

            # Unexpected OSError, re-raise.

            raise

    filename = key + '_imagenet.pth'

    cached_file = os.path.join(model_dir, filename)


    if not os.path.exists(cached_file):

        if comm.is_main_process():

            gdown.download(model_urls[key], cached_file, quiet=False)


    comm.synchronize()


    state_dict = torch.load(cached_file, map_location=torch.device('cpu'))

    model_dict = model.state_dict()

    new_state_dict = OrderedDict()

    matched_layers, discarded_layers = [], []


    for k, v in state_dict.items():

        if k.startswith('module.'):

            k = k[7:]  # discard module.


        if k in model_dict and model_dict[k].size() == v.size():

            new_state_dict[k] = v

            matched_layers.append(k)

        else:

            discarded_layers.append(k)


    model_dict.update(new_state_dict)

    model.load_state_dict(model_dict)


    if len(matched_layers) == 0:

        warnings.warn(

            'The pretrained weights from "{}" cannot be loaded, '

            'please check the key names manually '

            '(** ignored and continue **)'.format(cached_file)

        )

    else:

        logger.info(

            'Successfully loaded imagenet pretrained weights from "{}"'.format(cached_file)

        )

        if len(discarded_layers) > 0:

            logger.info(

                '** The following layers are discarded '

                'due to unmatched keys or layer size: {}'.format(discarded_layers)

            )


@BACKBONE_REGISTRY.register()


def build_osnet_backbone(cfg):

    """

    Create a OSNet instance from config.

    Returns:

        OSNet: a :class:`OSNet` instance

    """


    # fmt: off

    pretrain      = cfg.MODEL.BACKBONE.PRETRAIN

    pretrain_path = cfg.MODEL.BACKBONE.PRETRAIN_PATH

    with_ibn      = cfg.MODEL.BACKBONE.WITH_IBN

    bn_norm       = cfg.MODEL.BACKBONE.NORM

    depth         = cfg.MODEL.BACKBONE.DEPTH

    # fmt: on


    num_blocks_per_stage = [2, 2, 2]

    num_channels_per_stage = {

        "x1_0": [64, 256, 384, 512],

        "x0_75": [48, 192, 288, 384],

        "x0_5": [32, 128, 192, 256],

        "x0_25": [16, 64, 96, 128]}[depth]

    model = OSNet([OSBlock, OSBlock, OSBlock], num_blocks_per_stage, num_channels_per_stage,

                  bn_norm, IN=with_ibn)


    if pretrain:

        # Load pretrain path if specifically

        if pretrain_path:

            try:

                state_dict = torch.load(pretrain_path, map_location=torch.device('cpu'))

                logger.info(f"Loading pretrained model from {pretrain_path}")

                model.load_state_dict(state_dict)

            except FileNotFoundError as e:

                logger.info(f'{pretrain_path} is not found! Please check this path.')

                raise e

            except KeyError as e:

                logger.info("State dict keys error! Please check the state dict.")

                raise e

        else:

            if with_ibn:

                pretrain_key = "osnet_ibn_" + depth

            else:

                pretrain_key = "osnet_" + depth


            init_pretrained_weights(model, pretrain_key)

    return model


fastreid.modeling.backbones.osnet.ChannelGate
Definition osnet.py:171

fastreid.modeling.backbones.osnet.ChannelGate.fc1
fc1
Definition osnet.py:189

fastreid.modeling.backbones.osnet.ChannelGate.norm1
norm1
Definition osnet.py:196

fastreid.modeling.backbones.osnet.ChannelGate.fc2
fc2
Definition osnet.py:199

fastreid.modeling.backbones.osnet.ChannelGate.__init__
__init__(self, in_channels, num_gates=None, return_gates=False, gate_activation='sigmoid', reduction=16, layer_norm=False)
Definition osnet.py:182

fastreid.modeling.backbones.osnet.ChannelGate.global_avgpool
global_avgpool
Definition osnet.py:187

fastreid.modeling.backbones.osnet.ChannelGate.return_gates
return_gates
Definition osnet.py:185

fastreid.modeling.backbones.osnet.ChannelGate.relu
relu
Definition osnet.py:198

fastreid.modeling.backbones.osnet.ChannelGate.forward
forward(self, x)
Definition osnet.py:217

fastreid.modeling.backbones.osnet.ChannelGate.gate_activation
gate_activation
Definition osnet.py:207

fastreid.modeling.backbones.osnet.Conv1x1
Definition osnet.py:74

fastreid.modeling.backbones.osnet.Conv1x1.forward
forward(self, x)
Definition osnet.py:91

fastreid.modeling.backbones.osnet.Conv1x1.relu
relu
Definition osnet.py:89

fastreid.modeling.backbones.osnet.Conv1x1.conv
conv
Definition osnet.py:79

fastreid.modeling.backbones.osnet.Conv1x1.__init__
__init__(self, in_channels, out_channels, bn_norm, stride=1, groups=1)
Definition osnet.py:77

fastreid.modeling.backbones.osnet.Conv1x1.bn
bn
Definition osnet.py:88

fastreid.modeling.backbones.osnet.Conv1x1Linear
Definition osnet.py:98

fastreid.modeling.backbones.osnet.Conv1x1Linear.conv
conv
Definition osnet.py:103

fastreid.modeling.backbones.osnet.Conv1x1Linear.__init__
__init__(self, in_channels, out_channels, bn_norm, stride=1)
Definition osnet.py:101

fastreid.modeling.backbones.osnet.Conv1x1Linear.bn
bn
Definition osnet.py:106

fastreid.modeling.backbones.osnet.Conv1x1Linear.forward
forward(self, x)
Definition osnet.py:108

fastreid.modeling.backbones.osnet.Conv3x3
Definition osnet.py:114

fastreid.modeling.backbones.osnet.Conv3x3.relu
relu
Definition osnet.py:129

fastreid.modeling.backbones.osnet.Conv3x3.forward
forward(self, x)
Definition osnet.py:131

fastreid.modeling.backbones.osnet.Conv3x3.__init__
__init__(self, in_channels, out_channels, bn_norm, stride=1, groups=1)
Definition osnet.py:117

fastreid.modeling.backbones.osnet.Conv3x3.bn
bn
Definition osnet.py:128

fastreid.modeling.backbones.osnet.Conv3x3.conv
conv
Definition osnet.py:119

fastreid.modeling.backbones.osnet.ConvLayer
Basic layers.
Definition osnet.py:37

fastreid.modeling.backbones.osnet.ConvLayer.forward
forward(self, x)
Definition osnet.py:67

fastreid.modeling.backbones.osnet.ConvLayer.relu
relu
Definition osnet.py:65

fastreid.modeling.backbones.osnet.ConvLayer.bn
bn
Definition osnet.py:62

fastreid.modeling.backbones.osnet.ConvLayer.conv
conv
Definition osnet.py:52

fastreid.modeling.backbones.osnet.ConvLayer.__init__
__init__(self, in_channels, out_channels, kernel_size, bn_norm, stride=1, padding=0, groups=1, IN=False)
Definition osnet.py:50

fastreid.modeling.backbones.osnet.LightConv3x3
Definition osnet.py:138

fastreid.modeling.backbones.osnet.LightConv3x3.conv1
conv1
Definition osnet.py:145

fastreid.modeling.backbones.osnet.LightConv3x3.bn
bn
Definition osnet.py:157

fastreid.modeling.backbones.osnet.LightConv3x3.forward
forward(self, x)
Definition osnet.py:160

fastreid.modeling.backbones.osnet.LightConv3x3.relu
relu
Definition osnet.py:158

fastreid.modeling.backbones.osnet.LightConv3x3.__init__
__init__(self, in_channels, out_channels, bn_norm)
Definition osnet.py:143

fastreid.modeling.backbones.osnet.LightConv3x3.conv2
conv2
Definition osnet.py:148

fastreid.modeling.backbones.osnet.OSBlock
Definition osnet.py:229

fastreid.modeling.backbones.osnet.OSBlock.downsample
downsample
Definition osnet.py:262

fastreid.modeling.backbones.osnet.OSBlock.relu
relu
Definition osnet.py:267

fastreid.modeling.backbones.osnet.OSBlock.gate
gate
Definition osnet.py:260

fastreid.modeling.backbones.osnet.OSBlock.conv2a
conv2a
Definition osnet.py:244

fastreid.modeling.backbones.osnet.OSBlock.__init__
__init__(self, in_channels, out_channels, bn_norm, IN=False, bottleneck_reduction=4, **kwargs)
Definition osnet.py:240

fastreid.modeling.backbones.osnet.OSBlock.forward
forward(self, x)
Definition osnet.py:269

fastreid.modeling.backbones.osnet.OSBlock.conv3
conv3
Definition osnet.py:261

fastreid.modeling.backbones.osnet.OSBlock.conv2b
conv2b
Definition osnet.py:245

fastreid.modeling.backbones.osnet.OSBlock.conv1
conv1
Definition osnet.py:243

fastreid.modeling.backbones.osnet.OSBlock.IN
IN
Definition osnet.py:265

fastreid.modeling.backbones.osnet.OSBlock.conv2c
conv2c
Definition osnet.py:249

fastreid.modeling.backbones.osnet.OSBlock.conv2d
conv2d
Definition osnet.py:254

fastreid.modeling.backbones.osnet.OSNet
Definition osnet.py:289

fastreid.modeling.backbones.osnet.OSNet.conv5
conv5
Definition osnet.py:340

fastreid.modeling.backbones.osnet.OSNet.forward
forward(self, x)
Definition osnet.py:392

fastreid.modeling.backbones.osnet.OSNet._make_layer
_make_layer(self, block, layer, in_channels, out_channels, bn_norm, reduce_spatial_size, IN=False)
Definition osnet.py:353

fastreid.modeling.backbones.osnet.OSNet.conv4
conv4
Definition osnet.py:332

fastreid.modeling.backbones.osnet.OSNet._init_params
_init_params(self)
Definition osnet.py:370

fastreid.modeling.backbones.osnet.OSNet.conv3
conv3
Definition osnet.py:324

fastreid.modeling.backbones.osnet.OSNet.conv1
conv1
Definition osnet.py:313

fastreid.modeling.backbones.osnet.OSNet.conv2
conv2
Definition osnet.py:315

fastreid.modeling.backbones.osnet.OSNet.__init__
__init__(self, blocks, layers, channels, bn_norm, IN=False, **kwargs)
Definition osnet.py:306

fastreid.modeling.backbones.osnet.OSNet.maxpool
maxpool
Definition osnet.py:314

fastreid.layers
Definition __init__.py:1

fastreid.modeling.backbones.osnet.init_pretrained_weights
init_pretrained_weights(model, key='')
Definition osnet.py:402

fastreid.modeling.backbones.osnet.build_osnet_backbone
build_osnet_backbone(cfg)
Definition osnet.py:486

fastreid.utils
Definition __init__.py:1