Helper Module for Deep Learning.

Source code for pynet.models.unet

# -*- coding: utf-8 -*-
##########################################################################
# NSAp - Copyright (C) CEA, 2019
# Distributed under the terms of the CeCILL-B license, as published by
# the CEA-CNRS-INRIA. Refer to the LICENSE file or to
# http://www.cecill.info/licences/Licence_CeCILL-B_V1-en.html
# for details.
##########################################################################

"""
The U-Net is a convolutional encoder-decoder neural network.
"""

# Imports
import logging
import collections
import torch
import torch.nn as nn
import torch.nn.functional as func
from pynet.interfaces import DeepLearningDecorator
from pynet.utils import Networks
import numpy as np


# Global parameters
logger = logging.getLogger("pynet")


[docs]@Networks.register
@DeepLearningDecorator(family=("encoder", "segmenter"))
class UNet(nn.Module):
    """ UNet.

    The U-Net is a convolutional encoder-decoder neural network.
    Contextual spatial information (from the decoding,
    expansive pathway) about an input tensor is merged with
    information representing the localization of details
    (from the encoding, compressive pathway).
    Modifications to the original paper:

    - padding is used in 3x3x3 convolutions to prevent loss
      of border pixels
    - merging outputs does not require cropping due to (1)
    - residual connections can be used by specifying
      UNet(merge_mode='add')
    - if non-parametric upsampling is used in the decoder
      pathway (specified by upmode='upsample'), then an
      additional 1x1x1 3d convolution occurs after upsampling
      to reduce channel dimensionality by a factor of 2.
      This channel halving happens with the convolution in
      the tranpose convolution (specified by upmode='transpose')
    """

[docs]    def __init__(self, num_classes, in_channels=1, depth=5,
                 start_filts=64, up_mode="transpose",
                 merge_mode="concat", batchnorm=False, dim="3d",
                 input_shape=None):
        """ Init class.

        Parameters
        ----------
        num_classes: int
            the number of features in the output segmentation map.
        in_channels: int, default 1
            number of channels in the input tensor.
        depth: int, default 5
            number of layers in the U-Net.
        start_filts: int, default 64
            number of convolutional filters for the first conv.
        up_mode: string, default 'transpose'
            type of upconvolution. Choices: 'transpose' for transpose
            convolution, 'upsample' for nearest neighbour upsampling.
        merge_mode: str, default 'concat'
            the skip connections merging strategy.
        batchnorm: bool, default False
            normalize the inputs of the activation function.
        dim: str, default '3d'
            '3d' or '2d' input data.
        input_shape: uplet
            the tensor data shape (X, Y, Z) used during upsample (by default
            use a scale factor of 2).
        """
        # Inheritance
        nn.Module.__init__(self)

        # Check inputs
        if dim in ("2d", "3d"):
            self.dim = dim
        else:
            raise ValueError(
                "'{}' is not a valid mode for merging up and down paths. Only "
                "'3d' and '2d' are allowed.".format(dim))
        if up_mode in ("transpose", "upsample"):
            self.up_mode = up_mode
        else:
            raise ValueError(
                "'{}' is not a valid mode for upsampling. Only 'transpose' "
                "and 'upsample' are allowed.".format(up_mode))
        if merge_mode in ("concat", "add"):
            self.merge_mode = merge_mode
        else:
            raise ValueError(
                "'{}' is not a valid mode for merging up and down paths. Only "
                "'concat' and 'add' are allowed.".format(up_mode))
        if self.up_mode == "upsample" and self.merge_mode == "add":
            raise ValueError(
                "up_mode 'upsample' is incompatible with merge_mode 'add' at "
                "the moment because it doesn't make sense to use nearest "
                "neighbour to reduce depth channels (by half).")

        # Declare class parameters
        self.num_classes = num_classes
        self.in_channels = in_channels
        self.start_filts = start_filts
        self.depth = depth
        self.down = []
        self.up = []
        self.shapes = None
        if input_shape is not None:
            self.shapes = self._downsample_shape(
                input_shape, nb_iterations=(depth - 2))
            self.shapes = self.shapes[::-1]

        # Create the encoder pathway
        for cnt in range(depth):
            in_channels = self.in_channels if cnt == 0 else out_channels
            out_channels = self.start_filts * (2**cnt)
            pooling = False if cnt == 0 else True
            self.down.append(
                Down(in_channels, out_channels, self.dim, pooling=pooling,
                     batchnorm=batchnorm))

        # Create the decoder pathway
        # - careful! decoding only requires depth-1 blocks
        for cnt in range(depth - 1):
            in_channels = out_channels
            out_channels = in_channels // 2
            shape = None
            if self.shapes is not None:
                shape = self.shapes[cnt]
            self.up.append(
                Up(in_channels, out_channels, up_mode=up_mode, dim=self.dim,
                   merge_mode=merge_mode, batchnorm=batchnorm, shape=shape))

        # Add the list of modules to current module
        self.down = nn.ModuleList(self.down)
        self.up = nn.ModuleList(self.up)

        # Get ouptut segmentation
        self.conv_final = Conv1x1x1(out_channels, self.num_classes, self.dim)

        # Kernel initializer
        self.kernel_initializer()

    def _downsample_shape(self, shape, nb_iterations=1, scale_factor=2):
        shape = np.asarray(shape)
        all_shapes = [shape.astype(int).tolist()]
        for idx in range(nb_iterations):
            shape = np.floor(shape / scale_factor)
            all_shapes.append(shape.astype(int).tolist())
        return all_shapes

[docs]    def kernel_initializer(self):
        for module in self.modules():
            self.init_weight(module, self.dim)

[docs]    @staticmethod
    def init_weight(module, dim):
        conv_fn = getattr(nn, "Conv{0}".format(dim))
        if isinstance(module, conv_fn):
            nn.init.xavier_normal_(module.weight)
            nn.init.constant_(module.bias, 0)

[docs]    def forward(self, x):
        logger.debug("Unet...")
        logger.debug("  input: {0} - {1} - {2}".format(
            x.shape, x.get_device(), x.dtype))
        encoder_outs = []
        for module in self.down:
            x = module(x)
            logger.debug("  down: {0} - {1} - {2}".format(
                x.shape, x.get_device(), x.dtype))
            encoder_outs.append(x)
        encoder_outs = encoder_outs[:-1][::-1]
        for cnt, module in enumerate(self.up):
            x_up = encoder_outs[cnt]
            logger.debug("  skip: {0} - {1}".format(
                x.shape, x_up.shape))
            x = module(x, x_up)
            logger.debug("  up: {0} - {1} - {2}".format(
                x.shape, x.get_device(), x.dtype))

        # No softmax is used. This means you need to use
        # nn.CrossEntropyLoss in your training script,
        # as this module includes a softmax already.
        x = self.conv_final(x)
        logger.debug("  final: {0} - {1} - {2}".format(
            x.shape, x.get_device(), x.dtype))
        return x


[docs]class DoubleConv(nn.Module):
[docs]    def __init__(self, in_channels, out_channels, dim, kernel_size=3, stride=1,
                 padding=1, bias=True, batchnorm=True):
        super(DoubleConv, self).__init__()
        self.conv_fn = getattr(nn, "Conv{0}".format(dim))
        self.norm_fn = getattr(nn, "BatchNorm{0}".format(dim))
        if batchnorm:
            self.ops = nn.Sequential(collections.OrderedDict([
                ("conv1", self.conv_fn(
                    in_channels, out_channels, kernel_size, stride=stride,
                    padding=padding, bias=bias)),
                ("norm1", self.norm_fn(out_channels)),
                ("leakyrelu1", nn.LeakyReLU()),
                ("conv2", self.conv_fn(
                    out_channels, out_channels, kernel_size, stride=stride,
                    padding=padding, bias=bias)),
                ("norm2", self.norm_fn(out_channels)),
                ("leakyrelu2", nn.LeakyReLU())]))
        else:
            self.ops = nn.Sequential(collections.OrderedDict([
                ("conv1", self.conv_fn(
                    in_channels, out_channels, kernel_size, stride=stride,
                    padding=padding, bias=bias)),
                ("leakyrelu1", nn.LeakyReLU()),
                ("conv2", self.conv_fn(
                    out_channels, out_channels, kernel_size, stride=stride,
                    padding=padding, bias=bias)),
                ("leakyrelu2", nn.LeakyReLU())]))

[docs]    def forward(self, x):
        x = self.ops(x)
        return x


[docs]def UpConv(in_channels, out_channels, dim, mode="transpose", shape=None):
    convt_fn = getattr(nn, "ConvTranspose{0}".format(dim))
    if mode == "transpose":
        return convt_fn(
            in_channels, out_channels, kernel_size=2, stride=2)
    else:
        if shape is None:
            return nn.Sequential(collections.OrderedDict([
                ("up", nn.Upsample(mode="nearest", scale_factor=2)),
                ("conv1x", Conv1x1x1(in_channels, out_channels, dim))]))
        else:
            return nn.Sequential(collections.OrderedDict([
                ("up", nn.Upsample(mode="nearest", size=shape)),
                ("conv1x", Conv1x1x1(in_channels, out_channels, dim))]))


[docs]def Conv1x1x1(in_channels, out_channels, dim, groups=1):
    conv_fn = getattr(nn, "Conv{0}".format(dim))
    return conv_fn(
        in_channels, out_channels, kernel_size=1, groups=groups, stride=1)


[docs]class Down(nn.Module):
    """
    A helper Module that performs 2 convolutions and 1 MaxPool.
    A LeakyReLU activation and optionally a BatchNorm follows each convolution.
    """
[docs]    def __init__(self, in_channels, out_channels, dim, pooling=True,
                 batchnorm=True):
        super(Down, self).__init__()
        self.pool_fn = getattr(nn, "MaxPool{0}".format(dim))
        if pooling:
            self.ops = nn.Sequential(collections.OrderedDict([
                ("maxpool", self.pool_fn(2)),
                ("doubleconv", DoubleConv(
                    in_channels, out_channels, dim, batchnorm=batchnorm))]))
        else:
            self.ops = nn.Sequential(collections.OrderedDict([
                ("doubleconv", DoubleConv(
                    in_channels, out_channels, dim, batchnorm=batchnorm))]))

[docs]    def forward(self, x):
        x = self.ops(x)
        return x


[docs]class Up(nn.Module):
    """
    A helper Module that performs 2 convolutions and 1 UpConvolution.
    A LeakyReLU activation and optionally a BatchNorm follows each convolution.
    """
[docs]    def __init__(self, in_channels, out_channels, dim, merge_mode="concat",
                 up_mode="transpose", batchnorm=True, shape=None):
        super(Up, self).__init__()
        self.merge_mode = merge_mode
        if merge_mode in ("concat", "add"):
            self.upconv = UpConv(
                in_channels, out_channels, dim, shape=shape, mode=up_mode)
        else:
            self.upconv = UpConv(
                in_channels, in_channels, dim, shape=shape, mode=up_mode)
        self.doubleconv = DoubleConv(
            in_channels, out_channels, dim, batchnorm=batchnorm)

[docs]    def forward(self, x_down, x_up=None):
        x_down = self.upconv(x_down)
        if self.merge_mode == "concat":
            x = torch.cat((x_up, x_down), dim=1)
        elif self.merge_mode == "add":
            x = x_up + x_down
        else:
            x = x_down
        x = self.doubleconv(x)
        return x
Helper Module for Deep Learning.

Source code for pynet.models.unet

Follow us