dc/de4/models_2backbones_2stgcn_8py_source.html

import torch

import torch.nn as nn


from smaction.utils.gcn_utils import GCNBlock, TCNBlock

from smaction.utils.graph import Graph


class STGCNBlock(nn.Module):
    r"""Applies a spatial temporal graph convolution over an input graph sequence.

    The block runs a graph convolution (``GCNBlock``) followed by a temporal
    convolution (``TCNBlock``), adds the residual branch to the result and
    applies a ReLU.

    Args:
        in_channels (int): Number of channels in the input sequence data
        out_channels (int): Number of channels produced by the convolution
        kernel_size (tuple): Size of the temporal convolving kernel and graph
            convolving kernel, as ``(temporal, spatial)``. The temporal size
            must be odd.
        stride (int, optional): Stride of the temporal convolution. Default: 1
        dropout (float, optional): Dropout rate of the final output. Default: 0
        residual (bool, optional): If ``True``, applies a residual mechanism.
            Default: ``True``

    Shape:
        - Input[0]: Input graph sequence in :math:`(N, in_channels, T_{in}, V)` format
        - Input[1]: Input graph adjacency matrix in :math:`(K, V, V)` format
        - Output[0]: Output graph sequence in :math:`(N, out_channels, T_{out}, V)` format
        - Output[1]: Graph adjacency matrix for output data in :math:`(K, V, V)` format

        where
            :math:`N` is a batch size,
            :math:`K` is the spatial kernel size, as :math:`K == kernel_size[1]`,
            :math:`T_{in}/T_{out}` is a length of input/output sequence,
            :math:`V` is the number of graph nodes.
    """

    def __init__(self,
                 in_channels,
                 out_channels,
                 kernel_size,
                 stride=1,
                 dropout=0,
                 residual=True):
        super().__init__()

        assert len(kernel_size) == 2, \
            'kernel_size must be a (temporal, spatial) pair'
        assert kernel_size[0] % 2 == 1, \
            'temporal kernel size must be odd'

        self.gcn = GCNBlock(in_channels, out_channels, kernel_size[1])
        self.tcn = TCNBlock(out_channels, kernel_size[0], stride, dropout)

        # The parameter-free residual branches are named functions rather
        # than lambdas: a lambda stored on the instance cannot be pickled,
        # which breaks pickling of the whole module.
        if not residual:
            self.residual = self._zero_residual
        elif (in_channels == out_channels) and (stride == 1):
            self.residual = self._identity_residual
        else:
            # Channel count or temporal length changes, so the skip path is
            # projected with a strided 1x1 convolution followed by batch norm.
            self.residual = nn.Sequential(
                nn.Conv2d(
                    in_channels,
                    out_channels,
                    kernel_size=1,
                    stride=(stride, 1)),
                nn.BatchNorm2d(out_channels),
            )

        self.relu = nn.ReLU(inplace=True)

    @staticmethod
    def _zero_residual(x):
        """Residual branch used when the skip connection is disabled."""
        return 0

    @staticmethod
    def _identity_residual(x):
        """Residual branch that passes the block input through unchanged."""
        return x

    def forward(self, x, A):
        """Run the block on ``x`` with adjacency ``A``.

        Returns:
            tuple: The activated output sequence and the adjacency matrix
            returned by the graph convolution.
        """
        # The residual is taken from the block input, before the graph
        # convolution replaces ``x``.
        res = self.residual(x)
        x, A = self.gcn(x, A)
        x = self.tcn(x) + res

        return self.relu(x), A


class STGCN(nn.Module):
    r"""Spatial temporal graph convolutional network backbone.

    Normalizes the input with a batch norm over the flattened
    ``(node, channel)`` axis and passes it through a stack of ten
    :class:`STGCNBlock` layers. The output of the last block is returned
    as-is; no pooling or classification layer is applied in this module.

    Args:
        in_channels (int): Number of channels in the input data
        graph_args (dict): The arguments for building the graph, forwarded
            as ``Graph(**graph_args)``
        edge_importance_weighting (bool): If ``True``, adds a learnable
            importance weighting to the edges of the graph
        input_key: Key under which the input tensor is stored in the
            ``sample_dict`` passed to :meth:`forward`
        **kwargs (optional): Other parameters for graph convolution units.
            ``dropout`` is not forwarded to the first block.

    Shape:
        - Input: ``sample_dict[input_key]`` in :math:`(N, T_{in}, V_{in}, C)`
          format, where :math:`C` must equal ``in_channels`` and
          :math:`V_{in}` the number of graph nodes (the batch norm is sized
          ``in_channels * A.size(1)``)
        - Output: feature map of the last block; per the ``STGCNBlock``
          shape contract this is :math:`(N, 256, T_{out}, V_{in})`

        where
            :math:`N` is a batch size,
            :math:`T_{in}/T_{out}` is a length of input/output sequence,
            :math:`V_{in}` is the number of graph nodes.
    """

    def __init__(self, in_channels, graph_args,
                 edge_importance_weighting, input_key, **kwargs):
        super().__init__()

        # load graph
        self.graph = Graph(**graph_args)
        A = torch.tensor(self.graph.A, dtype=torch.float32, requires_grad=False)
        # Registered as a buffer so it follows the module across devices and
        # is stored in the state dict without being trained.
        self.register_buffer('A', A)

        # build networks
        spatial_kernel_size = A.size(0)
        temporal_kernel_size = 9
        kernel_size = (temporal_kernel_size, spatial_kernel_size)
        self.data_bn = nn.BatchNorm1d(in_channels * A.size(1))
        # The first block is built without the caller's dropout setting.
        kwargs0 = {k: v for k, v in kwargs.items() if k != 'dropout'}
        self.st_gcn_networks = nn.ModuleList((
            STGCNBlock(in_channels, 64, kernel_size, 1, residual=False, **kwargs0),
            STGCNBlock(64, 64, kernel_size, 1, **kwargs),
            STGCNBlock(64, 64, kernel_size, 1, **kwargs),
            STGCNBlock(64, 64, kernel_size, 1, **kwargs),
            STGCNBlock(64, 128, kernel_size, 2, **kwargs),
            STGCNBlock(128, 128, kernel_size, 1, **kwargs),
            STGCNBlock(128, 128, kernel_size, 1, **kwargs),
            STGCNBlock(128, 256, kernel_size, 2, **kwargs),
            STGCNBlock(256, 256, kernel_size, 1, **kwargs),
            STGCNBlock(256, 256, kernel_size, 1, **kwargs),
        ))

        # initialize parameters for edge importance weighting
        if edge_importance_weighting:
            # One learnable mask per block, initialized to ones so the
            # adjacency is initially left unchanged.
            self.edge_importance = nn.ParameterList([
                nn.Parameter(torch.ones(self.A.size()))
                for _ in self.st_gcn_networks
            ])
        else:
            # Plain scalar 1 per block: ``A * 1`` leaves the adjacency as is.
            self.edge_importance = [1] * len(self.st_gcn_networks)

        self.input_key = input_key

    def forward(self, sample_dict):
        """Extract features from ``sample_dict[self.input_key]``.

        Args:
            sample_dict: Mapping that holds the input tensor of shape
                ``(N, T, V, C)`` under ``self.input_key``.

        Returns:
            The output of the last graph convolution block.

        Raises:
            ValueError: If the input tensor is not 4-dimensional.
        """
        x = sample_dict[self.input_key]
        if x.dim() != 4:
            raise ValueError(
                'expected a 4-D input of shape (N, T, V, C), got shape {}'
                .format(tuple(x.shape)))

        # data normalization: fold nodes and channels into one feature axis
        # so that BatchNorm1d normalizes each (node, channel) pair over the
        # batch and time axes.
        N, T, V, C = x.size()
        x = x.permute(0, 2, 3, 1).contiguous()  # N, V, C, T
        x = x.view(N, V * C, T)
        x = self.data_bn(x)
        x = x.view(N, V, C, T)
        x = x.permute(0, 2, 3, 1).contiguous()  # N, C, T, V

        # forward: each block gets the adjacency scaled by its own importance
        for gcn, importance in zip(self.st_gcn_networks, self.edge_importance):
            x, _ = gcn(x, self.A * importance)

        return x


stgcn.STGCNBlock
Definition stgcn.py:7

stgcn.STGCNBlock.forward
forward(self, x, A)
Definition stgcn.py:65

stgcn.STGCNBlock.residual
residual
Definition stgcn.py:48

stgcn.STGCNBlock.__init__
__init__(self, in_channels, out_channels, kernel_size, stride=1, dropout=0, residual=True)
Definition stgcn.py:38

stgcn.STGCNBlock.tcn
tcn
Definition stgcn.py:45

stgcn.STGCNBlock.relu
relu
Definition stgcn.py:63

stgcn.STGCNBlock.gcn
gcn
Definition stgcn.py:44

stgcn.STGCN
Definition stgcn.py:73

stgcn.STGCN.__init__
__init__(self, in_channels, graph_args, edge_importance_weighting, input_key, **kwargs)
Definition stgcn.py:94

stgcn.STGCN.input_key
input_key
Definition stgcn.py:130

stgcn.STGCN.graph
graph
Definition stgcn.py:98

stgcn.STGCN.st_gcn_networks
st_gcn_networks
Definition stgcn.py:108

stgcn.STGCN.forward
forward(self, sample_dict)
Definition stgcn.py:132

stgcn.STGCN.edge_importance
edge_importance
Definition stgcn.py:123

stgcn.STGCN.data_bn
data_bn
Definition stgcn.py:106

torch.nn