# Source code for ezflow.modules.blocks

import torch.nn as nn
import torch.nn.functional as F

from ..config import configurable
from .build import MODULE_REGISTRY


@MODULE_REGISTRY.register()
class BasicBlock(nn.Module):
    """
    Basic residual block for ResNet-style architectures

    The residual branch is two 3x3 convolutions, each followed by a
    normalization layer, with the activation in between. Its output is added
    to the shortcut branch and the sum is passed through the activation.

    Parameters
    ----------
    in_channels : int
        Number of input channels
    out_channels : int
        Number of output channels
    stride : int, optional
        Stride of the first convolution and of the projection shortcut
    norm : str, optional
        Normalization method. One of "group", "batch", "instance", "none"
        (case-insensitive) or None. "none" and None both disable normalization
    activation : str, optional
        Activation function. "leakyrelu" (case-insensitive) selects
        LeakyReLU with a negative slope of 0.1, None disables the activation,
        and any other string selects ReLU

    Raises
    ------
    ValueError
        If ``norm`` is a string that is not one of the supported methods
    """

    @configurable
    def __init__(
        self, in_channels, out_channels, stride=1, norm="group", activation="relu"
    ):
        super(BasicBlock, self).__init__()

        # The identity shortcut only works when the residual branch keeps both
        # the spatial size (stride == 1) and the channel count; otherwise the
        # addition in forward() would fail on mismatched shapes.
        needs_projection = stride != 1 or in_channels != out_channels

        # At least one group, so GroupNorm is constructible for out_channels < 8.
        num_groups = max(1, out_channels // 8)

        norm1 = self._make_norm(norm, out_channels, num_groups)
        norm2 = self._make_norm(norm, out_channels, num_groups)

        self.activation = self._make_activation(activation)

        self.residual_fn = nn.Sequential(
            nn.Conv2d(
                in_channels, out_channels, kernel_size=3, padding=1, stride=stride
            ),
            norm1,
            self.activation,
            nn.Conv2d(out_channels, out_channels, kernel_size=3, padding=1),
            norm2,
        )

        self.shortcut = nn.Identity()
        if needs_projection:
            # 1x1 convolution that matches the residual branch's output shape.
            self.shortcut = nn.Sequential(
                nn.Conv2d(in_channels, out_channels, kernel_size=1, stride=stride),
                self._make_norm(norm, out_channels, num_groups),
            )

    @staticmethod
    def _make_norm(norm, num_channels, num_groups):
        """Build one normalization layer for ``num_channels`` feature maps."""
        kind = "none" if norm is None else norm.lower()

        if kind == "group":
            return nn.GroupNorm(num_groups=num_groups, num_channels=num_channels)
        if kind == "batch":
            return nn.BatchNorm2d(num_channels)
        if kind == "instance":
            return nn.InstanceNorm2d(num_channels)
        if kind == "none":
            return nn.Identity()

        raise ValueError(
            f'Unsupported norm "{norm}". '
            'Expected one of "group", "batch", "instance", "none" or None.'
        )

    @staticmethod
    def _make_activation(activation):
        """Build the activation module shared by the residual branch and output."""
        if activation is None:
            return nn.Identity()
        if activation.lower() == "leakyrelu":
            return nn.LeakyReLU(negative_slope=0.1, inplace=True)
        # Every other string falls back to ReLU.
        return nn.ReLU(inplace=True)

    @classmethod
    def from_config(cls, cfg):
        """
        Translate a config node into the keyword arguments of ``__init__``

        Parameters
        ----------
        cfg : object
            Config exposing IN_CHANNELS, OUT_CHANNELS, STRIDE, NORM and
            ACTIVATION attributes

        Returns
        -------
        dict
            Keyword arguments keyed by the constructor's parameter names
        """
        return {
            "in_channels": cfg.IN_CHANNELS,
            "out_channels": cfg.OUT_CHANNELS,
            "stride": cfg.STRIDE,
            "norm": cfg.NORM,
            "activation": cfg.ACTIVATION,
        }

    def forward(self, x):
        """
        Apply the residual branch, add the shortcut and activate the sum

        Parameters
        ----------
        x : torch.Tensor
            Input passed to both the residual branch and the shortcut

        Returns
        -------
        torch.Tensor
            Activated sum of the residual and shortcut outputs
        """
        out = self.residual_fn(x)
        out = self.activation(out + self.shortcut(x))

        return out


@MODULE_REGISTRY.register()
class BottleneckBlock(nn.Module):
    """
    Bottleneck residual block for ResNet-style architectures

    The residual branch is a 1x1 convolution down to ``out_channels // 4``
    channels, a (possibly strided) 3x3 convolution at that width, and a 1x1
    convolution back up to ``out_channels``. Each convolution is followed by
    a normalization layer. The branch output is added to the shortcut branch
    and the sum is passed through the activation.

    Parameters
    ----------
    in_channels : int
        Number of input channels
    out_channels : int
        Number of output channels
    stride : int, optional
        Stride of the 3x3 convolution and of the projection shortcut
    norm : str, optional
        Normalization method. One of "group", "batch", "instance", "none"
        (case-insensitive) or None. "none" and None both disable normalization
    activation : str, optional
        Activation function. "leakyrelu" (case-insensitive) selects
        LeakyReLU with a negative slope of 0.1, None disables the activation,
        and any other string selects ReLU

    Raises
    ------
    ValueError
        If ``norm`` is a string that is not one of the supported methods
    """

    @configurable
    def __init__(
        self, in_channels, out_channels, stride=1, norm="group", activation="relu"
    ):
        super(BottleneckBlock, self).__init__()

        # The identity shortcut only works when the residual branch keeps both
        # the spatial size (stride == 1) and the channel count; otherwise the
        # addition in forward() would fail on mismatched shapes.
        needs_projection = stride != 1 or in_channels != out_channels

        # Width of the two inner (bottleneck) convolutions.
        mid_channels = out_channels // 4

        # At least one group, so GroupNorm is constructible for out_channels < 8.
        num_groups = max(1, out_channels // 8)

        norm1 = self._make_norm(norm, mid_channels, num_groups)
        norm2 = self._make_norm(norm, mid_channels, num_groups)
        norm3 = self._make_norm(norm, out_channels, num_groups)

        self.activation = self._make_activation(activation)

        self.residual_fn = nn.Sequential(
            nn.Conv2d(in_channels, mid_channels, kernel_size=1),
            norm1,
            self.activation,
            nn.Conv2d(
                mid_channels,
                mid_channels,
                stride=stride,
                kernel_size=3,
                padding=1,
            ),
            norm2,
            self.activation,
            nn.Conv2d(mid_channels, out_channels, kernel_size=1),
            norm3,
        )

        self.shortcut = nn.Identity()
        if needs_projection:
            # 1x1 convolution that matches the residual branch's output shape.
            self.shortcut = nn.Sequential(
                nn.Conv2d(in_channels, out_channels, kernel_size=1, stride=stride),
                self._make_norm(norm, out_channels, num_groups),
            )

    @staticmethod
    def _make_norm(norm, num_channels, num_groups):
        """Build one normalization layer for ``num_channels`` feature maps."""
        kind = "none" if norm is None else norm.lower()

        if kind == "group":
            return nn.GroupNorm(num_groups=num_groups, num_channels=num_channels)
        if kind == "batch":
            return nn.BatchNorm2d(num_channels)
        if kind == "instance":
            return nn.InstanceNorm2d(num_channels)
        if kind == "none":
            return nn.Identity()

        raise ValueError(
            f'Unsupported norm "{norm}". '
            'Expected one of "group", "batch", "instance", "none" or None.'
        )

    @staticmethod
    def _make_activation(activation):
        """Build the activation module shared by the residual branch and output."""
        if activation is None:
            return nn.Identity()
        if activation.lower() == "leakyrelu":
            return nn.LeakyReLU(negative_slope=0.1, inplace=True)
        # Every other string falls back to ReLU.
        return nn.ReLU(inplace=True)

    @classmethod
    def from_config(cls, cfg):
        """
        Translate a config node into the keyword arguments of ``__init__``

        Parameters
        ----------
        cfg : object
            Config exposing IN_CHANNELS, OUT_CHANNELS, STRIDE, NORM and
            ACTIVATION attributes

        Returns
        -------
        dict
            Keyword arguments keyed by the constructor's parameter names
        """
        return {
            "in_channels": cfg.IN_CHANNELS,
            "out_channels": cfg.OUT_CHANNELS,
            "stride": cfg.STRIDE,
            "norm": cfg.NORM,
            "activation": cfg.ACTIVATION,
        }

    def forward(self, x):
        """
        Apply the residual branch, add the shortcut and activate the sum

        Parameters
        ----------
        x : torch.Tensor
            Input passed to both the residual branch and the shortcut

        Returns
        -------
        torch.Tensor
            Activated sum of the residual and shortcut outputs
        """
        out = self.residual_fn(x)
        out = self.activation(out + self.shortcut(x))

        return out