# squeezesegV2.py

#!/usr/bin/env python3
# This file is covered by the LICENSE file in the root of this project.

from __future__ import print_function
import torch
import torch.nn as nn
import torch.nn.functional as F


class Fire(nn.Module):
    """Fire block: a 1x1 squeeze followed by parallel 1x1 / 3x3 expands.

    Every convolution is followed by BatchNorm2d and a ReLU. The two expand
    branches both read the squeezed tensor and their outputs are concatenated
    along dim 1, so the block emits
    ``expand1x1_planes + expand3x3_planes`` channels. All convolutions use
    the default stride, and the 3x3 branch uses padding 1, so both branches
    produce the same spatial size.

    Args:
        inplanes: number of channels of the incoming tensor.
        squeeze_planes: number of channels after the squeeze convolution.
        expand1x1_planes: output channels of the 1x1 expand branch.
        expand3x3_planes: output channels of the 3x3 expand branch.
        bn_d: value handed to every BatchNorm2d layer as ``momentum``.
    """

    def __init__(self, inplanes, squeeze_planes,
                 expand1x1_planes, expand3x3_planes, bn_d=0.1):
        super().__init__()
        self.inplanes = inplanes
        self.bn_d = bn_d

        # One ReLU instance is shared by the squeeze and both expand paths.
        self.activation = nn.ReLU(inplace=True)

        # Squeeze stage: channel reduction with a pointwise convolution.
        self.squeeze = nn.Conv2d(inplanes, squeeze_planes, kernel_size=1)
        self.squeeze_bn = nn.BatchNorm2d(squeeze_planes, momentum=bn_d)

        # Expand stage, pointwise branch.
        self.expand1x1 = nn.Conv2d(
            squeeze_planes, expand1x1_planes, kernel_size=1)
        self.expand1x1_bn = nn.BatchNorm2d(expand1x1_planes, momentum=bn_d)

        # Expand stage, 3x3 branch.
        self.expand3x3 = nn.Conv2d(
            squeeze_planes, expand3x3_planes, kernel_size=3, padding=1)
        self.expand3x3_bn = nn.BatchNorm2d(expand3x3_planes, momentum=bn_d)

    def forward(self, x):
        """Run the block on ``x`` and return the channel-concatenated result."""
        squeezed = self.activation(self.squeeze_bn(self.squeeze(x)))
        branch_1x1 = self.activation(
            self.expand1x1_bn(self.expand1x1(squeezed)))
        branch_3x3 = self.activation(
            self.expand3x3_bn(self.expand3x3(squeezed)))
        return torch.cat((branch_1x1, branch_3x3), dim=1)


class CAM(nn.Module):
    """Attention gate computed from a max-pooled neighbourhood.

    The input is max-pooled with a 7x7 window (stride 1, padding 3, so the
    spatial size is unchanged), squeezed to a narrow bottleneck with a 1x1
    convolution + BatchNorm2d + ReLU, expanded back to ``inplanes`` channels
    with a second 1x1 convolution + BatchNorm2d, and passed through a
    sigmoid. The resulting map multiplies the original input element-wise.

    NOTE(review): presumably the "Context Aggregation Module" of
    SqueezeSegV2 -- confirm against the reference implementation.

    Args:
        inplanes: number of channels of the incoming tensor (also the number
            of channels returned).
        bn_d: value handed to both BatchNorm2d layers as ``momentum``.
        reduction: channel reduction factor of the bottleneck. The bottleneck
            has ``inplanes // reduction`` channels, clamped to at least one
            so that small ``inplanes`` values do not produce a zero-channel
            layer. The default of 16 reproduces the previous hard-coded
            behaviour for every ``inplanes >= 16``.

    Raises:
        ValueError: if ``reduction`` is smaller than 1.
    """

    def __init__(self, inplanes, bn_d=0.1, reduction=16):
        super().__init__()
        if reduction < 1:
            raise ValueError(
                "reduction must be >= 1, got {}".format(reduction))
        self.inplanes = inplanes
        self.bn_d = bn_d
        self.reduction = reduction

        # Never let the bottleneck collapse to zero channels.
        squeezed_planes = max(1, inplanes // reduction)

        self.pool = nn.MaxPool2d(7, 1, 3)
        self.squeeze = nn.Conv2d(inplanes, squeezed_planes,
                                 kernel_size=1, stride=1)
        self.squeeze_bn = nn.BatchNorm2d(squeezed_planes, momentum=self.bn_d)
        self.relu = nn.ReLU(inplace=True)
        self.unsqueeze = nn.Conv2d(squeezed_planes, inplanes,
                                   kernel_size=1, stride=1)
        self.unsqueeze_bn = nn.BatchNorm2d(inplanes, momentum=self.bn_d)
        self.sigmoid = nn.Sigmoid()

    def forward(self, x):
        """Return ``x`` scaled element-wise by the sigmoid attention map."""
        # 7x7 pooling
        y = self.pool(x)
        # squeezing and relu
        y = self.relu(self.squeeze_bn(self.squeeze(y)))
        # unsqueezing; the sigmoid keeps the gate inside (0, 1)
        y = self.sigmoid(self.unsqueeze_bn(self.unsqueeze(y)))
        # attention
        return y * x

# ******************************************************************************


class Backbone(nn.Module):
    """SqueezeNet-style encoder assembled from Fire and CAM blocks.

    Subclasses ``torch.nn.Module``. The encoder consists of two strided
    convolution stems (``conv1a``, ``conv1b``) followed by three Fire stages
    (``fire23``, ``fire45``, ``fire6789``), each opened by a max pool. Every
    strided layer uses stride 1 along the first spatial dimension and stride
    2 along the last one, so only the last dimension is downsampled (five
    times by a factor of two). Dropout2d is applied after each Fire stage.

    Args:
        params: mapping with the keys read by the constructor:
            ``params["input_depth"]["range"]``,
            ``params["input_depth"]["xyz"]`` and
            ``params["input_depth"]["remission"]`` (truthy values enable the
            corresponding input channels), ``params["bn_d"]`` (BatchNorm
            momentum) and ``params["dropout"]`` (Dropout2d probability).

    Raises:
        ValueError: if none of the three input groups is enabled, since the
            network would then have zero input channels.
    """

    def __init__(self, params):
        # Call the super constructor
        super().__init__()
        print("Using SqueezeNet Backbone")
        input_cfg = params["input_depth"]
        self.use_range = input_cfg["range"]
        self.use_xyz = input_cfg["xyz"]
        self.use_remission = input_cfg["remission"]
        self.bn_d = params["bn_d"]
        self.drop_prob = params["dropout"]

        # Input depth calc: channel 0 is range, 1-3 are xyz, 4 is remission.
        self.input_depth = 0
        self.input_idxs = []
        if self.use_range:
            self.input_depth += 1
            self.input_idxs.append(0)
        if self.use_xyz:
            self.input_depth += 3
            self.input_idxs.extend([1, 2, 3])
        if self.use_remission:
            self.input_depth += 1
            self.input_idxs.append(4)
        if not self.input_idxs:
            # Fail early with a clear message instead of building a
            # convolution with zero input channels.
            raise ValueError(
                "Backbone needs at least one of the 'range', 'xyz' or "
                "'remission' inputs enabled in params['input_depth']")
        print("Depth of backbone input = ", self.input_depth)

        # stride play
        self.strides = [2, 2, 2, 2]

        # encoder
        self.conv1a = nn.Sequential(
            nn.Conv2d(self.input_depth, 32, kernel_size=3,
                      stride=(1, self.strides[0]), padding=1),
            nn.BatchNorm2d(32, momentum=self.bn_d),
            nn.ReLU(inplace=True),
            CAM(32, bn_d=self.bn_d))
        # NOTE: this stem's stride is fixed and not taken from self.strides.
        self.conv1b = nn.Sequential(
            nn.Conv2d(32, 64, kernel_size=3, stride=(1, 2), padding=1),
            nn.BatchNorm2d(64, momentum=self.bn_d),
            nn.ReLU(inplace=True),
            CAM(64, bn_d=self.bn_d))
        self.fire23 = nn.Sequential(
            nn.MaxPool2d(kernel_size=3, stride=(1, self.strides[1]),
                         padding=1),
            Fire(64, 16, 64, 64, bn_d=self.bn_d),
            CAM(128, bn_d=self.bn_d),
            Fire(128, 16, 64, 64, bn_d=self.bn_d),
            CAM(128, bn_d=self.bn_d))
        self.fire45 = nn.Sequential(
            nn.MaxPool2d(kernel_size=3, stride=(1, self.strides[2]),
                         padding=1),
            Fire(128, 32, 128, 128, bn_d=self.bn_d),
            Fire(256, 32, 128, 128, bn_d=self.bn_d))
        self.fire6789 = nn.Sequential(
            nn.MaxPool2d(kernel_size=3, stride=(1, self.strides[3]),
                         padding=1),
            Fire(256, 48, 192, 192, bn_d=self.bn_d),
            Fire(384, 48, 192, 192, bn_d=self.bn_d),
            Fire(384, 64, 256, 256, bn_d=self.bn_d),
            Fire(512, 64, 256, 256, bn_d=self.bn_d))

        # output
        self.dropout = nn.Dropout2d(self.drop_prob)

        # last channels: the final Fire block emits 256 + 256 channels
        self.last_channels = 512

    def run_layer(self, x, layer):
        """Apply ``layer`` to ``x`` and return the result."""
        return layer(x)

    def forward(self, x):
        """Encode ``x`` and return the output of the last Fire stage.

        Only the channels listed in ``self.input_idxs`` are taken from dim 1
        of ``x`` before the network is run.
        """
        # filter input
        x = x[:, self.input_idxs]

        # run cnn
        x = self.conv1a(x)
        x = self.conv1b(x)

        # every Fire stage is followed by the shared dropout layer
        for stage in (self.fire23, self.fire45, self.fire6789):
            x = self.run_layer(x, stage)
            x = self.run_layer(x, self.dropout)
        return x

    def get_last_depth(self):
        """Return the number of channels produced by ``forward``."""
        return self.last_channels

    def get_input_depth(self):
        """Return the number of input channels the first convolution expects."""
        return self.input_depth