Safemotion Lib
Loading...
Searching...
No Matches
mgn.py
Go to the documentation of this file.
1# encoding: utf-8
2"""
3@author: liaoxingyu
4@contact: sherlockliao01@gmail.com
5"""
6import copy
7
8import torch
9from torch import nn
10
11from fastreid.layers import get_norm
12from fastreid.modeling.backbones import build_backbone
13from fastreid.modeling.backbones.resnet import Bottleneck
14from fastreid.modeling.heads import build_heads
15from fastreid.modeling.losses import *
16from .build import META_ARCH_REGISTRY
17
18
@META_ARCH_REGISTRY.register()
class MGN(nn.Module):
    """Multiple Granularity Network (MGN) meta-architecture for re-ID.

    A shared backbone stem (conv1 through the first block of layer3) feeds
    three branches:

    * ``b1``: global branch using the backbone's original ``layer4``.
    * ``b2``: part branch whose feature map is additionally split into
      2 horizontal stripes (``b21``, ``b22``).
    * ``b3``: part branch whose feature map is additionally split into
      3 horizontal stripes (``b31``, ``b32``, ``b33``).

    The part branches run a stride-1 re-build of ``layer4``
    (``res_p_conv5``) so the output map stays tall enough to chunk along
    the height axis.  Every whole-branch and every stripe feature gets its
    own embedding head built from ``cfg``.
    """

    def __init__(self, cfg):
        super().__init__()
        self._cfg = cfg
        assert len(cfg.MODEL.PIXEL_MEAN) == len(cfg.MODEL.PIXEL_STD)
        # Buffers (not parameters): saved in checkpoints and moved by .to()/.cuda().
        self.register_buffer("pixel_mean", torch.Tensor(cfg.MODEL.PIXEL_MEAN).view(1, -1, 1, 1))
        self.register_buffer("pixel_std", torch.Tensor(cfg.MODEL.PIXEL_STD).view(1, -1, 1, 1))

        # fmt: off
        # backbone
        bn_norm  = cfg.MODEL.BACKBONE.NORM
        with_se  = cfg.MODEL.BACKBONE.WITH_SE
        extra_bn = cfg.MODEL.BACKBONE.EXTRA_BN
        # fmt: on

        backbone = build_backbone(cfg)
        # Shared stem: everything up to and including the first block of layer3.
        self.backbone = nn.Sequential(
            backbone.conv1,
            backbone.bn1,
            backbone.relu,
            backbone.maxpool,
            backbone.layer1,
            backbone.layer2,
            backbone.layer3[0]
        )
        # Remainder of layer3; deep-copied once per branch below.
        res_conv4 = nn.Sequential(*backbone.layer3[1:])
        # Global branch keeps the original (downsampling) layer4.
        res_g_conv5 = backbone.layer4

        # Stride-1 rebuild of layer4 for the part branches: the 1x1 conv
        # downsample matches layer4's projection shapes, so the pretrained
        # layer4 weights can be loaded directly.
        res_p_conv5 = nn.Sequential(
            Bottleneck(1024, 512, bn_norm, False, with_se, downsample=nn.Sequential(
                nn.Conv2d(1024, 2048, 1, bias=False), get_norm(bn_norm, 2048))),
            Bottleneck(2048, 512, bn_norm, False, with_se),
            Bottleneck(2048, 512, bn_norm, False, with_se))
        res_p_conv5.load_state_dict(backbone.layer4.state_dict())

        # branch1: global feature only
        self.b1 = nn.Sequential(
            copy.deepcopy(res_conv4),
            copy.deepcopy(res_g_conv5)
        )
        self.b1_head = build_heads(cfg)

        # branch2: whole-branch feature + 2 horizontal stripes
        self.b2 = nn.Sequential(
            copy.deepcopy(res_conv4),
            copy.deepcopy(res_p_conv5)
        )
        self.b2_head = build_heads(cfg)
        self.b21_head = build_heads(cfg)
        self.b22_head = build_heads(cfg)

        # branch3: whole-branch feature + 3 horizontal stripes
        self.b3 = nn.Sequential(
            copy.deepcopy(res_conv4),
            copy.deepcopy(res_p_conv5)
        )
        self.b3_head = build_heads(cfg)
        self.b31_head = build_heads(cfg)
        self.b32_head = build_heads(cfg)
        self.b33_head = build_heads(cfg)

        self.has_extra_bn = extra_bn
        if extra_bn:
            # Optional per-branch BN applied to each branch's feature map
            # before it is fed to the heads.
            self.heads_extra_bn_b1 = get_norm(bn_norm, 2048)
            self.heads_extra_bn_b2 = get_norm(bn_norm, 2048)
            self.heads_extra_bn_b3 = get_norm(bn_norm, 2048)

    @property
    def device(self):
        """Device the model lives on, inferred from a registered buffer."""
        return self.pixel_mean.device

    def forward(self, batched_inputs):
        """Run all three branches.

        Training: returns a dict of per-head outputs plus ``targets``,
        consumed by :meth:`losses`.
        Inference: returns the concatenation of all eight pooled head
        features along dim 1.
        """
        images = self.preprocess_image(batched_inputs)
        features = self.backbone(images)  # shared mid-level feature map

        # branch1 (global)
        b1_feat = self.b1(features)
        if self.has_extra_bn: b1_feat = self.heads_extra_bn_b1(b1_feat)

        # branch2: whole map plus a 2-way split along the height axis
        b2_feat = self.b2(features)
        if self.has_extra_bn: b2_feat = self.heads_extra_bn_b2(b2_feat)
        b21_feat, b22_feat = torch.chunk(b2_feat, 2, dim=2)

        # branch3: whole map plus a 3-way split along the height axis
        b3_feat = self.b3(features)
        if self.has_extra_bn: b3_feat = self.heads_extra_bn_b3(b3_feat)
        b31_feat, b32_feat, b33_feat = torch.chunk(b3_feat, 3, dim=2)

        if self.training:
            assert "targets" in batched_inputs, "Person ID annotation are missing in training!"
            targets = batched_inputs["targets"].long().to(self.device)

            # NOTE(review): negative targets appear to be a sentinel for
            # "unlabeled" batches; zeroing keeps the heads runnable — confirm
            # against the data loader's conventions.
            if targets.sum() < 0: targets.zero_()

            b1_outputs = self.b1_head(b1_feat, targets)
            b2_outputs = self.b2_head(b2_feat, targets)
            b21_outputs = self.b21_head(b21_feat, targets)
            b22_outputs = self.b22_head(b22_feat, targets)
            b3_outputs = self.b3_head(b3_feat, targets)
            b31_outputs = self.b31_head(b31_feat, targets)
            b32_outputs = self.b32_head(b32_feat, targets)
            b33_outputs = self.b33_head(b33_feat, targets)

            return {
                "b1_outputs": b1_outputs,
                "b2_outputs": b2_outputs,
                "b21_outputs": b21_outputs,
                "b22_outputs": b22_outputs,
                "b3_outputs": b3_outputs,
                "b31_outputs": b31_outputs,
                "b32_outputs": b32_outputs,
                "b33_outputs": b33_outputs,
                "targets": targets,
            }
        else:
            b1_pool_feat = self.b1_head(b1_feat)
            b2_pool_feat = self.b2_head(b2_feat)
            b21_pool_feat = self.b21_head(b21_feat)
            b22_pool_feat = self.b22_head(b22_feat)
            b3_pool_feat = self.b3_head(b3_feat)
            b31_pool_feat = self.b31_head(b31_feat)
            b32_pool_feat = self.b32_head(b32_feat)
            b33_pool_feat = self.b33_head(b33_feat)

            pred_feat = torch.cat([b1_pool_feat, b2_pool_feat, b3_pool_feat, b21_pool_feat,
                                   b22_pool_feat, b31_pool_feat, b32_pool_feat, b33_pool_feat], dim=1)
            return pred_feat

    def preprocess_image(self, batched_inputs):
        r"""
        Normalize and batch the input images.

        Accepts either a dict with an ``"images"`` tensor or a raw tensor.
        Note: normalization is done in place on the input tensor.
        """
        if isinstance(batched_inputs, dict):
            images = batched_inputs["images"].to(self.device)
        elif isinstance(batched_inputs, torch.Tensor):
            images = batched_inputs.to(self.device)
        else:
            raise TypeError("batched_inputs must be dict or torch.Tensor, but get {}".format(type(batched_inputs)))

        images.sub_(self.pixel_mean).div_(self.pixel_std)
        return images

    def losses(self, outs):
        """Compute MGN losses from the training outputs of :meth:`forward`.

        Cross-entropy is applied to all eight classifier heads (each scaled
        by 1/8); the triplet loss is applied to the three whole-branch
        embeddings plus the concatenated stripe embeddings of b2 and b3
        (each scaled by 1/5).
        """
        gt_labels = outs["targets"]

        # Log prediction accuracy using the global branch's logits.
        log_accuracy(outs["b1_outputs"]['pred_class_logits'].detach(), gt_labels)

        # Stripe embeddings are concatenated per branch for the triplet loss.
        b22_pool_feat = torch.cat((outs["b21_outputs"]['features'],
                                   outs["b22_outputs"]['features']), dim=1)
        b33_pool_feat = torch.cat((outs["b31_outputs"]['features'],
                                   outs["b32_outputs"]['features'],
                                   outs["b33_outputs"]['features']), dim=1)

        loss_dict = {}
        loss_names = self._cfg.MODEL.LOSSES.NAME

        if "CrossEntropyLoss" in loss_names:
            ce_cfg = self._cfg.MODEL.LOSSES.CE
            # One classification loss per head, each weighted 1/8.
            for branch in ("b1", "b2", "b21", "b22", "b3", "b31", "b32", "b33"):
                loss_dict['loss_cls_' + branch] = cross_entropy_loss(
                    outs[branch + "_outputs"]['cls_outputs'],
                    gt_labels,
                    ce_cfg.EPSILON,
                    ce_cfg.ALPHA,
                ) * ce_cfg.SCALE * 0.125

        if "TripletLoss" in loss_names:
            tri_cfg = self._cfg.MODEL.LOSSES.TRI
            # Triplet loss on whole-branch features and on the concatenated
            # stripe features, each weighted 1/5.
            tri_feats = (
                ("b1", outs["b1_outputs"]['features']),
                ("b2", outs["b2_outputs"]['features']),
                ("b3", outs["b3_outputs"]['features']),
                ("b22", b22_pool_feat),
                ("b33", b33_pool_feat),
            )
            for branch, feat in tri_feats:
                loss_dict['loss_triplet_' + branch] = triplet_loss(
                    feat,
                    gt_labels,
                    tri_cfg.MARGIN,
                    tri_cfg.NORM_FEAT,
                    tri_cfg.HARD_MINING,
                ) * tri_cfg.SCALE * 0.2

        return loss_dict
forward(self, batched_inputs)
Definition mgn.py:91
preprocess_image(self, batched_inputs)
Definition mgn.py:149